local support for Arch-Router via Ollama

This commit is contained in:
Salman Paracha 2025-06-20 17:12:12 -07:00
parent 1bbd35f1ab
commit 85d59e20ec
2 changed files with 46 additions and 0 deletions

View file

@ -144,6 +144,7 @@ impl RouterModel for RouterModelV1 {
content: Some(ContentType::Text(messages_content)),
role: USER_ROLE.to_string(),
}],
temperature: Some(0.01),
..Default::default()
}
}

View file

@ -0,0 +1,45 @@
# Gateway configuration that routes prompts with an Arch-Router model served
# from a local endpoint and forwards them to OpenAI-backed providers.
version: v0.1.0

# `model` matches the `name` of the first entry under `llm_providers`.
routing:
  model: arch-router

listeners:
  egress_traffic:
    # Listens on all interfaces.
    address: 0.0.0.0
    port: 12000
    message_format: openai
    timeout: 30s

llm_providers:
  # Router model. Port 11434 is Ollama's default; `host.docker.internal`
  # lets a process inside a Docker container reach the host machine.
  # NOTE(review): confirm whether a local endpoint still needs `access_key`.
  - name: arch-router
    access_key: $ARCH_API_KEY
    provider_interface: arch
    # Quoted because the value contains a colon (the `:Q4_K_M` tag).
    model: 'hf.co/katanemo/Arch-Router-1.5B.gguf:Q4_K_M'
    endpoint: 'host.docker.internal:11434'

  - name: gpt-4o-mini
    provider_interface: openai
    access_key: $OPENAI_API_KEY
    model: gpt-4o-mini

  # Presumably the fallback provider when no `usage` description matches;
  # verify against the gateway's routing documentation.
  - name: gpt-4.1
    provider_interface: openai
    access_key: $OPENAI_API_KEY
    model: gpt-4.1
    default: true

  # The two entries below carry a free-text `usage` description
  # (presumably what the router model matches prompts against) and both
  # point at the same underlying model, gpt-4.1.
  - name: code_generation
    access_key: $OPENAI_API_KEY
    provider_interface: openai
    model: gpt-4.1
    usage: generating new code snippets, functions, or boilerplate based on user prompts or requirements

  - name: code_understanding
    provider_interface: openai
    access_key: $OPENAI_API_KEY
    model: gpt-4.1
    usage: understand and explain existing code snippets, functions, or libraries

tracing:
  # NOTE(review): looks like a percentage (100 = sample everything); confirm.
  random_sampling: 100