mirror of
https://github.com/katanemo/plano.git
synced 2026-05-15 11:02:39 +02:00
make arch-router cluster optional (#518)
This commit is contained in:
parent
a212dd79da
commit
147908ba7e
9 changed files with 44 additions and 30 deletions
|
|
@ -1,8 +1,5 @@
|
|||
version: v0.1.0
|
||||
|
||||
routing:
|
||||
model: arch-router
|
||||
|
||||
listeners:
|
||||
egress_traffic:
|
||||
address: 0.0.0.0
|
||||
|
|
@ -12,11 +9,6 @@ listeners:
|
|||
|
||||
llm_providers:
|
||||
|
||||
- name: arch-router
|
||||
access_key: $ARCH_API_KEY
|
||||
provider_interface: arch
|
||||
model: Arch-Router
|
||||
|
||||
- name: gpt-4o-mini
|
||||
provider_interface: openai
|
||||
access_key: $OPENAI_API_KEY
|
||||
|
|
|
|||
|
|
@ -1,7 +1,8 @@
|
|||
version: v0.1.0
|
||||
|
||||
routing:
|
||||
model: arch-router
|
||||
model: Arch-Router
|
||||
llm_provider: arch-router
|
||||
|
||||
listeners:
|
||||
egress_traffic:
|
||||
|
|
@ -13,7 +14,6 @@ listeners:
|
|||
llm_providers:
|
||||
|
||||
- name: arch-router
|
||||
access_key: $ARCH_API_KEY
|
||||
provider_interface: arch
|
||||
model: hf.co/katanemo/Arch-Router-1.5B.gguf:Q4_K_M
|
||||
endpoint: host.docker.internal:11434
|
||||
|
|
|
|||
|
|
@ -22,8 +22,8 @@ Content-Type: application/json
|
|||
|
||||
### get model list from arch-function
|
||||
GET https://archfc.katanemo.dev/v1/models HTTP/1.1
|
||||
model: arch-router
|
||||
model: Arch-Router
|
||||
|
||||
### get model list from arch-router (notice model header)
|
||||
### get model list from Arch-Router (notice model header)
|
||||
GET https://archfc.katanemo.dev/v1/models HTTP/1.1
|
||||
model: arch-router
|
||||
model: Arch-Router
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue