mirror of
https://github.com/katanemo/plano.git
synced 2026-05-09 15:52:44 +02:00
update orchestrator model name
This commit is contained in:
parent
48bf83fa0d
commit
680dee60a0
3 changed files with 9 additions and 7 deletions
|
|
@ -141,7 +141,7 @@ vllm serve katanemo/Plano-Orchestrator-4B \
|
|||
--gpu-memory-utilization 0.3 \
|
||||
--tokenizer katanemo/Plano-Orchestrator-4B \
|
||||
--chat-template chat_template.jinja \
|
||||
--served-model-name Plano-Orchestrator \
|
||||
--served-model-name katanemo/Plano-Orchestrator-4B \
|
||||
--enable-prefix-caching
|
||||
```
|
||||
|
||||
|
|
|
|||
|
|
@ -1,7 +1,7 @@
|
|||
version: v0.3.0
|
||||
|
||||
overrides:
|
||||
orchestrator_model: plano/Plano-Orchestrator
|
||||
orchestrator_model: plano/katanemo/Plano-Orchestrator-4B
|
||||
|
||||
agents:
|
||||
- id: weather_agent
|
||||
|
|
@ -10,7 +10,7 @@ agents:
|
|||
url: http://localhost:10520
|
||||
|
||||
model_providers:
|
||||
- model: plano/Plano-Orchestrator
|
||||
- model: plano/katanemo/Plano-Orchestrator-4B
|
||||
base_url: http://localhost:8000
|
||||
|
||||
- model: openai/gpt-5.2
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue