mirror of
https://github.com/katanemo/plano.git
synced 2026-05-04 05:12:55 +02:00
Replace RouterService/RouterModelV1 (arch-router prompt) with OrchestratorService/OrchestratorModelV1 (plano-orchestrator prompt) for LLM routing. This ensures the correct system prompt is used when llm_routing_model points at a Plano-Orchestrator model.

- Extend OrchestratorService with session caching, ModelMetricsService, top-level routing preferences, and determine_route() for LLM routing
- Delete RouterService, RouterModel trait, RouterModelV1, and ARCH_ROUTER_V1_SYSTEM_PROMPT
- Unify defaults to Plano-Orchestrator / plano-orchestrator
- Update CLI config generator, demos, docs, and config schema

Made-with: Cursor
33 lines
787 B
YAML
33 lines
787 B
YAML
# NOTE(review): presumably the config schema version this file targets — confirm.
version: v0.3.0

# Selects the model used for LLM routing. The same identifier is declared as a
# provider entry under model_providers in this file.
overrides:
  llm_routing_model: plano/Plano-Orchestrator

# A single listener of type `model`, named model_listener, bound to port 12000.
# NOTE(review): presumably the port clients send LLM requests to — confirm.
listeners:
  - type: model
    name: model_listener
    port: 12000

# Upstream models. access_key values are $VAR-style references rather than
# literal secrets (presumably resolved from the environment — confirm).
model_providers:

  # The model named by overrides.llm_routing_model; addressed by base_url and
  # declared without an access_key.
  - model: plano/Plano-Orchestrator
    base_url: http://plano-orchestrator:10000

  # The only entry flagged default: true.
  # NOTE(review): presumably used when no routing preference matches — confirm.
  - model: openai/gpt-4o-mini
    access_key: $OPENAI_API_KEY
    default: true

  # NOTE(review): each routing_preferences item is a name plus a free-text
  # description, presumably used to decide which requests go to this model.
  - model: openai/gpt-4o
    access_key: $OPENAI_API_KEY
    routing_preferences:
      - name: complex_reasoning
        description: complex reasoning tasks, multi-step analysis, or detailed explanations

  - model: anthropic/claude-sonnet-4-20250514
    access_key: $ANTHROPIC_API_KEY
    routing_preferences:
      - name: code_generation
        description: generating new code, writing functions, or creating boilerplate

# NOTE(review): random_sampling: 100 presumably means every request is traced
# (a percentage) — confirm the unit.
tracing:
  random_sampling: 100