# Gateway configuration: one egress listener, a list of upstream LLM
# providers, and a set of friendly aliases that map to provider models.
version: v0.1

# Listener that accepts outbound LLM traffic on all interfaces, port 12000,
# using the OpenAI message format.
listeners:
  egress_traffic:
    address: 0.0.0.0
    port: 12000
    message_format: openai
    timeout: 30s

# Upstream models, written as <provider>/<model>.
# NOTE(review): access_key values look like environment-variable references
# ($NAME) - confirm they are substituted at load time and never hard-coded.
llm_providers:
  # OpenAI Models
  - model: openai/gpt-5-mini-2025-08-07
    access_key: $OPENAI_API_KEY
    # The only entry flagged as the default provider.
    default: true

  - model: openai/gpt-4o-mini
    access_key: $OPENAI_API_KEY

  - model: openai/o3
    access_key: $OPENAI_API_KEY

  - model: openai/gpt-4o
    access_key: $OPENAI_API_KEY

  # Anthropic Models
  - model: anthropic/claude-3-5-sonnet-20241022
    access_key: $ANTHROPIC_API_KEY

  - model: anthropic/claude-3-haiku-20240307
    access_key: $ANTHROPIC_API_KEY

  # Azure OpenAI Models
  - model: azure_openai/gpt-5-mini
    access_key: $AZURE_API_KEY
    base_url: https://katanemo.openai.azure.com

  # Ollama Models (no access_key is configured for this entry)
  - model: ollama/llama3.1
    base_url: http://host.docker.internal:11434

# Model aliases - friendly names that map to actual provider names.
# Targets are written without the "<provider>/" prefix used in llm_providers.
model_aliases:
  # Alias for summarization tasks -> fast/cheap model
  arch.summarize.v1:
    target: gpt-5-mini-2025-08-07

  # Alias for general purpose tasks -> latest model
  # NOTE(review): arch.v1 targets o3 while arch.reasoning.v1 targets gpt-4o;
  # confirm this pairing is intended and not swapped.
  arch.v1:
    target: o3

  # Alias for reasoning tasks -> capable model
  arch.reasoning.v1:
    target: gpt-4o

  # Alias for creative tasks -> Claude model
  arch.creative.v1:
    target: claude-3-5-sonnet-20241022

  # Alias for quick responses -> fast model
  arch.fast.v1:
    target: claude-3-haiku-20240307

  # Semantic aliases
  summary-model:
    target: gpt-5-mini-2025-08-07

  chat-model:
    target: claude-3-5-sonnet-20241022

  creative-model:
    target: claude-3-5-sonnet-20241022