fix(context): allow claude-code structured output

2026-06-10 08:05:14 +02:00 · 2026-05-18 19:18:58 +02:00 · 2026-05-18 19:18:58 +02:00 · cf93ee53bd
commit cf93ee53bd
parent 0ecea6e548
2 changed files with 56 additions and 6 deletions
--- a/packages/context/src/llm/claude-code-runtime.test.ts
+++ b/packages/context/src/llm/claude-code-runtime.test.ts
@ -93,7 +93,17 @@ describe('ClaudeCodeKtxLlmRuntime', () => {

  it('validates structured output with the caller schema', async () => {
    const schema = z.object({ answer: z.string() });
-    const query = vi.fn((_input: any) => stream([initMessage(), resultMessage({ structured_output: { answer: 'yes' } })]));
+    const query = vi.fn((_input: any) =>
+      stream([
+        initMessage({
+          tools: ['StructuredOutput'],
+          slash_commands: ['/help', '/compact'],
+          skills: ['pdf'],
+          agents: ['claude', 'Explore'],
+        }),
+        resultMessage({ structured_output: { answer: 'yes' } }),
+      ]),
+    );
    const runtime = new ClaudeCodeKtxLlmRuntime({
      projectDir: '/tmp/project',
      modelSlots: { default: 'sonnet' },
@ -102,10 +112,40 @@ describe('ClaudeCodeKtxLlmRuntime', () => {
    });

    await expect(runtime.generateObject({ role: 'default', prompt: 'json', schema })).resolves.toEqual({ answer: 'yes' });
+    expect(query.mock.calls[0][0].options.maxTurns).toBe(2);
    expect(query.mock.calls[0][0].options.outputFormat).toMatchObject({
      type: 'json_schema',
      schema: expect.objectContaining({ type: 'object' }),
    });
+    expect(query.mock.calls[0][0].options.allowedTools).toEqual(['StructuredOutput']);
+    expect(
+      await query.mock.calls[0][0].options.canUseTool('StructuredOutput', {}, { signal: new AbortController().signal, toolUseID: 'structured' }),
+    ).toEqual({
+      behavior: 'allow',
+      toolUseID: 'structured',
+    });
+    expect(
+      await query.mock.calls[0][0].options.canUseTool('Bash', {}, { signal: new AbortController().signal, toolUseID: 'bash' }),
+    ).toMatchObject({
+      behavior: 'deny',
+      toolUseID: 'bash',
+    });
+  });
+
+  it('rejects StructuredOutput when text generation did not request structured output', async () => {
+    const query = vi.fn((_input: any) =>
+      stream([initMessage({ tools: ['StructuredOutput'] }), resultMessage({ result: 'hello' })]),
+    );
+    const runtime = new ClaudeCodeKtxLlmRuntime({
+      projectDir: '/tmp/project',
+      modelSlots: { default: 'sonnet' },
+      query,
+      env: {},
+    });
+
+    await expect(runtime.generateText({ role: 'default', prompt: 'say hello' })).rejects.toThrow(
+      /Claude Code runtime isolation failed: tools=StructuredOutput/,
+    );
  });

  it('registers only exact KTX MCP tool ids and denies non-KTX tools', async () => {
--- a/packages/context/src/llm/claude-code-runtime.ts
+++ b/packages/context/src/llm/claude-code-runtime.ts
@ -46,6 +46,7 @@ const BUILTIN_TOOLS = [
 ];

 const KTX_MCP_SERVER_NAME = 'ktx';
+const CLAUDE_CODE_STRUCTURED_OUTPUT_TOOL_ID = 'StructuredOutput';

 function isResult(message: SDKMessage): message is SDKResultMessage {
  return message.type === 'result';
@ -83,6 +84,7 @@ function modelForRole(modelSlots: ClaudeCodeKtxLlmRuntimeDeps['modelSlots'], rol
 function assertInitIsolation(
  message: SDKMessage,
  allowedToolIds: Set<string>,
+  requiredToolIds: Set<string>,
  expectedMcpServerNames: Set<string>,
 ): void {
  if (message.type !== 'system' || message.subtype !== 'init') {
@ -90,7 +92,7 @@ function assertInitIsolation(
  }
  const activeToolIds = new Set(message.tools);
  const unexpectedTools = message.tools.filter((toolName) => !allowedToolIds.has(toolName));
-  const missingTools = [...allowedToolIds].filter((toolName) => !activeToolIds.has(toolName));
+  const missingTools = [...requiredToolIds].filter((toolName) => !activeToolIds.has(toolName));
  const activeMcpServerNames = message.mcp_servers.map((server) => server.name);
  const unexpectedMcpServers = activeMcpServerNames.filter((name) => !expectedMcpServerNames.has(name));
  const missingMcpServers = [...expectedMcpServerNames].filter((name) => !activeMcpServerNames.includes(name));
@ -131,8 +133,9 @@ function baseOptions(input: {
  env: NodeJS.ProcessEnv | undefined;
  maxTurns: number;
  tools?: KtxRuntimeToolSet;
+  internalAllowedToolIds?: string[];
 }): Options {
-  const toolIds = mcpToolIds(input.tools ?? {});
+  const toolIds = [...mcpToolIds(input.tools ?? {}), ...(input.internalAllowedToolIds ?? [])];
  const allowedToolIds = new Set(toolIds);
  const expectedServerNames = [...expectedMcpServerNames(input.tools)];
  return {
@ -176,12 +179,13 @@ async function collectResult(params: {
  prompt: string;
  options: Options;
  allowedToolIds: Set<string>;
+  requiredToolIds?: Set<string>;
  expectedMcpServerNames: Set<string>;
  onAssistantTurn?: () => Promise<void>;
 }): Promise<SDKResultMessage> {
  let result: SDKResultMessage | undefined;
  for await (const message of params.query({ prompt: params.prompt, options: params.options })) {
-    assertInitIsolation(message, params.allowedToolIds, params.expectedMcpServerNames);
+    assertInitIsolation(message, params.allowedToolIds, params.requiredToolIds ?? params.allowedToolIds, params.expectedMcpServerNames);
    if (message.type === 'assistant' && message.parent_tool_use_id === null) {
      await params.onAssistantTurn?.();
    }
@ -217,6 +221,7 @@ export class ClaudeCodeKtxLlmRuntime implements KtxLlmRuntimePort {
      prompt: [input.system, input.prompt].filter(Boolean).join('\n\n'),
      options,
      allowedToolIds: new Set(mcpToolIds(input.tools ?? {})),
+      requiredToolIds: new Set(mcpToolIds(input.tools ?? {})),
      expectedMcpServerNames: expectedMcpServerNames(input.tools),
    });
    const error = resultError(result);
@ -237,16 +242,19 @@ export class ClaudeCodeKtxLlmRuntime implements KtxLlmRuntimePort {
        projectDir: this.deps.projectDir,
        model: modelForRole(this.deps.modelSlots, input.role),
        env: this.deps.env,
-        maxTurns: 1,
+        maxTurns: 2,
        tools: input.tools,
+        internalAllowedToolIds: [CLAUDE_CODE_STRUCTURED_OUTPUT_TOOL_ID],
      }),
      outputFormat: { type: 'json_schema' as const, schema: jsonSchema(input.schema as z.ZodType) },
    };
+    const allowedToolIds = new Set([...mcpToolIds(input.tools ?? {}), CLAUDE_CODE_STRUCTURED_OUTPUT_TOOL_ID]);
    const result = await collectResult({
      query: this.runQuery,
      prompt: [input.system, input.prompt].filter(Boolean).join('\n\n'),
      options,
-      allowedToolIds: new Set(mcpToolIds(input.tools ?? {})),
+      allowedToolIds,
+      requiredToolIds: new Set(mcpToolIds(input.tools ?? {})),
      expectedMcpServerNames: expectedMcpServerNames(input.tools),
    });
    const error = resultError(result);
@ -274,6 +282,7 @@ export class ClaudeCodeKtxLlmRuntime implements KtxLlmRuntimePort {
        prompt: params.userPrompt,
        options: { ...options, systemPrompt: params.systemPrompt },
        allowedToolIds: new Set(mcpToolIds(params.toolSet)),
+        requiredToolIds: new Set(mcpToolIds(params.toolSet)),
        expectedMcpServerNames: expectedMcpServerNames(params.toolSet),
        onAssistantTurn: async () => {
          stepIndex += 1;
@ -329,6 +338,7 @@ export async function runClaudeCodeAuthProbe(input: {
      prompt: 'Reply with exactly: ok',
      options,
      allowedToolIds: new Set(),
+      requiredToolIds: new Set(),
      expectedMcpServerNames: new Set(),
    });
    const error = resultError(result);