mirror of
https://github.com/katanemo/plano.git
synced 2026-05-09 07:42:43 +02:00
rename session pinning to model affinity with x-model-affinity header
This commit is contained in:
parent
5789694d2f
commit
da9792c2dd
14 changed files with 468 additions and 371 deletions
|
|
@@ -114,7 +114,7 @@ echo "--- 7. Session pinning - first call (fresh routing decision) ---"
|
|||
echo ""
|
||||
curl -s "$PLANO_URL/routing/v1/chat/completions" \
|
||||
-H "Content-Type: application/json" \
|
||||
- -H "X-Routing-Session-Id: demo-session-001" \
+ -H "X-Model-Affinity: demo-session-001" \
|
||||
-d '{
|
||||
"model": "gpt-4o-mini",
|
||||
"messages": [
|
||||
|
|
@@ -129,7 +129,7 @@ echo " Notice: same model returned with \"pinned\": true, routing was skipped
|
|||
echo ""
|
||||
curl -s "$PLANO_URL/routing/v1/chat/completions" \
|
||||
-H "Content-Type: application/json" \
|
||||
- -H "X-Routing-Session-Id: demo-session-001" \
+ -H "X-Model-Affinity: demo-session-001" \
|
||||
-d '{
|
||||
"model": "gpt-4o-mini",
|
||||
"messages": [
|
||||
|
|
@@ -143,7 +143,7 @@ echo "--- 9. Different session gets its own fresh routing ---"
|
|||
echo ""
|
||||
curl -s "$PLANO_URL/routing/v1/chat/completions" \
|
||||
-H "Content-Type: application/json" \
|
||||
- -H "X-Routing-Session-Id: demo-session-002" \
+ -H "X-Model-Affinity: demo-session-002" \
|
||||
-d '{
|
||||
"model": "gpt-4o-mini",
|
||||
"messages": [
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue