mirror of
https://github.com/katanemo/plano.git
synced 2026-04-25 16:56:24 +02:00
support session pinning for consistent model selection in routing (#813)
This commit is contained in:
parent
785bf7e021
commit
46a5bfd82d
8 changed files with 406 additions and 3 deletions
|
|
@ -415,6 +415,14 @@ properties:
|
|||
type: string
|
||||
model:
|
||||
type: string
|
||||
session_ttl_seconds:
|
||||
type: integer
|
||||
minimum: 1
|
||||
description: TTL in seconds for session-pinned routing cache entries. Default 600 (10 minutes).
|
||||
session_max_entries:
|
||||
type: integer
|
||||
minimum: 1
|
||||
description: Maximum number of session-pinned routing cache entries. Default 10000.
|
||||
additionalProperties: false
|
||||
state_storage:
|
||||
type: object
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue