Adding support for wildcard models in the model_providers config (#696)

* cleaning up plano cli commands
* adding support for wildcard model providers
* fixing compile errors
* fixing bugs related to default model provider, provider hint and duplicates in the model provider list
* fixed cargo fmt issues
* updating tests to always include the model id
* using default for the prompt_gateway path
* fixed the model name, as gpt-5-mini-2025-08-07 wasn't in the config
* making sure that all aliases and models match the config
* fixed the config generator to allow base_url LLM providers to include wildcard models
* re-ran the models list utility and added a shell script to run it
* updating docs to mention wildcard model providers
* updated provider_models.json to yaml, added that file to our docs for reference
* updating the build docs to use the new root-based build

---------

Co-authored-by: Salman Paracha <salmanparacha@MacBook-Pro-342.local>
2026-07-23 16:51:04 +02:00 · 2026-01-28 17:47:33 -08:00 · 2026-01-28 17:47:33 -08:00 · 2941392ed1
commit 2941392ed1
parent 8428b06e22
42 changed files with 1748 additions and 202 deletions
--- a/demos/samples_java/weather_forcecast_service/run_demo.sh
+++ b/demos/samples_java/weather_forcecast_service/run_demo.sh
@ -18,8 +18,8 @@ start_demo() {
    echo ".env file created with OPENAI_API_KEY."
  fi

-  # Step 3: Start Arch
-  echo "Starting Arch with config.yaml..."
+  # Step 3: Start Plano
+  echo "Starting Plano with config.yaml..."
  planoai up config.yaml

  # Step 4: Start developer services
@ -33,8 +33,8 @@ stop_demo() {
  echo "Stopping Network Agent using Docker Compose..."
  docker compose down

-  # Step 2: Stop Arch
-  echo "Stopping Arch..."
+  # Step 2: Stop Plano
+  echo "Stopping Plano..."
  planoai down
 }

--- a/demos/samples_python/currency_exchange/hurl_tests/simple.hurl
+++ b/demos/samples_python/currency_exchange/hurl_tests/simple.hurl
@ -8,7 +8,7 @@ Content-Type: application/json
      "content": "convert 100 eur"
    }
  ],
-  "model": "none"
+  "model": "gpt-4o"
 }
 HTTP 200
 [Asserts]
--- a/demos/samples_python/currency_exchange/hurl_tests/simple_stream.hurl
+++ b/demos/samples_python/currency_exchange/hurl_tests/simple_stream.hurl
@ -9,7 +9,7 @@ Content-Type: application/json
    }
  ],
  "stream": true,
-  "model": "none"
+  "model": "gpt-4o"
 }
 HTTP 200
 [Asserts]
--- a/demos/samples_python/currency_exchange/run_demo.sh
+++ b/demos/samples_python/currency_exchange/run_demo.sh
@ -18,8 +18,8 @@ start_demo() {
    echo ".env file created with OPENAI_API_KEY."
  fi

-  # Step 3: Start Arch
-  echo "Starting Arch with config.yaml..."
+  # Step 3: Start Plano
+  echo "Starting Plano with config.yaml..."
  planoai up config.yaml

  # Step 4: Start developer services
@ -33,8 +33,8 @@ stop_demo() {
  echo "Stopping Network Agent using Docker Compose..."
  docker compose down

-  # Step 2: Stop Arch
-  echo "Stopping Arch..."
+  # Step 2: Stop Plano
+  echo "Stopping Plano..."
  planoai down
 }

--- a/demos/use_cases/README.md
+++ b/demos/use_cases/README.md
@ -67,7 +67,7 @@ print("OpenAI Response:", response.choices[0].message.content)
 #### Step 3.2: Using curl command
 ```
 $ curl --header 'Content-Type: application/json' \
-  --data '{"messages": [{"role": "user","content": "What is the capital of France?"}], "model": "none"}' \
+  --data '{"messages": [{"role": "user","content": "What is the capital of France?"}], "model": "gpt-4o"}' \
  http://localhost:12000/v1/chat/completions

 {
@ -92,7 +92,7 @@ You can override model selection using `x-arch-llm-provider-hint` header. For ex
 ```
 $ curl --header 'Content-Type: application/json' \
  --header 'x-arch-llm-provider-hint: ministral-3b' \
-  --data '{"messages": [{"role": "user","content": "What is the capital of France?"}], "model": "none"}' \
+  --data '{"messages": [{"role": "user","content": "What is the capital of France?"}], "model": "gpt-4o"}' \
  http://localhost:12000/v1/chat/completions
 {
  ...
--- a/demos/use_cases/llm_routing/README.md
+++ b/demos/use_cases/llm_routing/README.md
@ -19,7 +19,7 @@ You can also pass in a header to override model when sending prompt. Following e

 $ curl --header 'Content-Type: application/json' \
  --header 'x-arch-llm-provider-hint: mistral/ministral-3b' \
-  --data '{"messages": [{"role": "user","content": "hello"}], "model": "none"}' \
+  --data '{"messages": [{"role": "user","content": "hello"}], "model": "gpt-4o"}' \
  http://localhost:12000/v1/chat/completions 2> /dev/null | jq .
 {
  "id": "xxx",
--- a/demos/use_cases/model_alias_routing/config_with_aliases.yaml
+++ b/demos/use_cases/model_alias_routing/config_with_aliases.yaml
@ -23,7 +23,13 @@ llm_providers:
  - model: openai/gpt-4o
    access_key: $OPENAI_API_KEY

-  # Anthropic Models
+  - model: openai/*
+    access_key: $OPENAI_API_KEY
+
+  # Anthropic - support all Claude models
+  - model: anthropic/*
+    access_key: $ANTHROPIC_API_KEY
+
  - model: anthropic/claude-sonnet-4-20250514
    access_key: $ANTHROPIC_API_KEY

--- a/demos/use_cases/preference_based_routing/hurl_tests/simple_stream.hurl
+++ b/demos/use_cases/preference_based_routing/hurl_tests/simple_stream.hurl
@ -5,13 +5,13 @@ Content-Type: application/json
  "messages": [
    {
      "role": "user",
-      "content": "hi"
+      "content": "Can you explain what this Python function does?\n\ndef fibonacci(n):\n    if n <= 1:\n        return n\n    return fibonacci(n-1) + fibonacci(n-2)"
    }
  ],
-  "model": "none",
+  "model": "openai/gpt-4o-mini",
  "stream": true
 }
 HTTP 200
 [Asserts]
 header "content-type" matches /text\/event-stream/
-body matches /^data: .*?gpt-4o-mini.*?\n/
+body matches /^data: .*?gpt-4o.*?\n/
--- a/demos/use_cases/preference_based_routing/test_router_endpoint.rest
+++ b/demos/use_cases/preference_based_routing/test_router_endpoint.rest
@ -34,7 +34,7 @@ POST http://localhost:12000/v1/chat/completions HTTP/1.1
 Content-Type: application/json

 {
-  "model": "none",
+  "model": "gpt-4o",
  "messages": [
    {
      "role": "user",
@ -49,7 +49,7 @@ POST http://localhost:12000/v1/chat/completions HTTP/1.1
 Content-Type: application/json

 {
-  "model": "none",
+  "model": "gpt-4o",
  "messages": [
    {
      "role": "user",