mirror of
https://github.com/katanemo/plano.git
synced 2026-06-20 15:28:07 +02:00
73 lines
1.6 KiB
YAML
73 lines
1.6 KiB
YAML
# Version tag of this configuration file (presumably the config schema
# version — confirm against the consuming tool).
version: v0.1

# Listener definitions, keyed by listener name.
listeners:
  # Listener named for egress traffic; speaks the `openai` message format.
  egress_traffic:
    address: 0.0.0.0  # wildcard IPv4 address: bind on every interface
    port: 12000
    message_format: openai
    timeout: 30s

# Upstream model providers. Each entry names a model as `<provider>/<model>`.
# `access_key` values are `$NAME` placeholders (presumably expanded from the
# environment — confirm), so no secret is stored in this file.
llm_providers:

  # OpenAI Models
  # The only entry flagged `default: true` in this list.
  - model: openai/gpt-5-mini-2025-08-07
    access_key: $OPENAI_API_KEY
    default: true

  - model: openai/gpt-4o-mini
    access_key: $OPENAI_API_KEY

  - model: openai/o3
    access_key: $OPENAI_API_KEY

  - model: openai/gpt-4o
    access_key: $OPENAI_API_KEY

  # Anthropic Models
  - model: anthropic/claude-3-5-sonnet-20241022
    access_key: $ANTHROPIC_API_KEY

  - model: anthropic/claude-3-haiku-20240307
    access_key: $ANTHROPIC_API_KEY

  # Azure OpenAI Models
  # Carries an explicit `base_url` in addition to the access key.
  - model: azure_openai/gpt-5-mini
    access_key: $AZURE_API_KEY
    base_url: https://katanemo.openai.azure.com

  # Ollama Models
  # No access key is configured for this entry; only a `base_url`.
  - model: ollama/llama3.1
    base_url: http://host.docker.internal:11434


# Model aliases - friendly names that map to actual provider names.
# Each `target` is written without the `<provider>/` prefix.
model_aliases:
  # Alias for summarization tasks -> fast/cheap model
  arch.summarize.v1:
    target: gpt-5-mini-2025-08-07

  # Alias for general purpose tasks -> latest model
  # NOTE(review): this alias targets o3 while the reasoning alias below
  # targets gpt-4o — confirm the two targets are not swapped.
  arch.v1:
    target: o3

  # Alias for reasoning tasks -> capable model
  arch.reasoning.v1:
    target: gpt-4o

  # Alias for creative tasks -> Claude model
  arch.creative.v1:
    target: claude-3-5-sonnet-20241022

  # Alias for quick responses -> fast model
  arch.fast.v1:
    target: claude-3-haiku-20240307

  # Semantic aliases
  summary-model:
    target: gpt-5-mini-2025-08-07

  # chat-model and creative-model both resolve to the same target.
  chat-model:
    target: claude-3-5-sonnet-20241022

  creative-model:
    target: claude-3-5-sonnet-20241022