# plano/demos/use_cases/llm_routing/arch_config.yaml
# 2025-05-28 19:08:00 -07:00

# 49 lines
# 996 B
# YAML

# Config schema version string; quoted so it is always read as a string.
version: '0.1-beta'
# Listener definitions. The single `egress_traffic` listener below binds to
# all interfaces (0.0.0.0) on port 12000.
listeners:
  egress_traffic:
    address: 0.0.0.0
    port: 12000
    # Message format is set to `openai`; presumably the wire format clients
    # are expected to speak on this listener (confirm against gateway docs).
    message_format: openai
    # Presumably the upstream request timeout for this listener.
    timeout: 30s
# LLM providers available to the gateway. Each entry carries:
#   name               - identifier for this provider entry
#   access_key         - `$NAME` reference; presumably resolved from the
#                        environment when the config is loaded, so every
#                        referenced variable must be exported beforehand
#   provider_interface - which vendor API this entry uses
#   model              - model identifier passed to that vendor
llm_providers:
  - name: gpt-4o-mini
    access_key: $OPENAI_API_KEY
    provider_interface: openai
    model: gpt-4o-mini

  # The only entry flagged `default: true`.
  - name: gpt-4o
    access_key: $OPENAI_API_KEY
    provider_interface: openai
    model: gpt-4o
    default: true

  - name: ministral-3b
    access_key: $MISTRAL_API_KEY
    provider_interface: mistral
    model: ministral-3b-latest

  # Both Claude entries share one key. The variable is spelled
  # ANTHROPIC_API_KEY (Anthropic's conventional name), not ANTHROPY_API_KEY.
  - name: claude-sonnet
    access_key: $ANTHROPIC_API_KEY
    provider_interface: claude
    model: claude-3-7-sonnet-latest

  - name: claude-sonnet-4
    access_key: $ANTHROPIC_API_KEY
    provider_interface: claude
    model: claude-sonnet-4-0

  - name: deepseek
    access_key: $DEEPSEEK_API_KEY
    provider_interface: deepseek
    model: deepseek-reasoner

  - name: groq
    access_key: $GROQ_API_KEY
    provider_interface: groq
    model: llama-3.1-8b-instant
# Tracing settings.
tracing:
  # Presumably a percentage, i.e. 100 = trace every request (confirm against
  # the gateway's tracing documentation).
  random_sampling: 100