# plano/demos/use_cases/preference_based_routing/arch_config.yaml
# (file-viewer listing: 40 lines, 869 B, YAML)

# Version string declared by this configuration (kept as a quoted string).
version: "0.1-beta"
# Routing settings. `model` carries the same value as the `name` of the first
# entry under `llm_providers`.
# NOTE(review): presumably this selects which provider entry acts as the
# router model — confirm against the gateway's configuration reference.
routing:
  model: archgw-v1-router-model
# Listener definitions. Only `egress_traffic` is configured here.
listeners:
  egress_traffic:
    # NOTE(review): 0.0.0.0 conventionally means "all IPv4 interfaces";
    # confirm that exposure is intended for this demo.
    address: 0.0.0.0
    port: 12000
    message_format: openai
    timeout: 30s
# LLM provider entries. Each item is a mapping keyed by `name`; all four use
# the `openai` provider interface.
llm_providers:
  # The only entry with an explicit `base_url` and no `access_key`.
  # NOTE(review): hard-coded IP address over plain HTTP — confirm the endpoint
  # is still valid and acceptable outside a demo.
  - name: archgw-v1-router-model
    provider_interface: openai
    model: cotran2/llama-1b-4-26
    base_url: http://35.192.87.187:8000/v1

  # Marked as the default provider.
  - name: gpt-4o-mini
    provider_interface: openai
    access_key: $OPENAI_API_KEY
    model: gpt-4o-mini
    default: true

  # `usage` is a free-text description attached to this provider.
  # NOTE(review): presumably consumed by the router model to decide when to
  # pick this provider — confirm against the gateway documentation.
  - name: gpt-4o
    provider_interface: openai
    access_key: $OPENAI_API_KEY
    model: gpt-4o
    usage: Generating original content such as scripts, articles, or creative materials.

  - name: o4-mini
    provider_interface: openai
    access_key: $OPENAI_API_KEY
    model: o4-mini
    usage: Requesting topic ideas specifically related to personal finance and budgeting.
# Tracing settings.
# NOTE(review): `random_sampling: 100` is presumably a percentage (sample
# every request) — confirm the unit against the gateway documentation.
tracing:
  random_sampling: 100