Overhaul demos directory: cleanup, restructure, and standardize configs (#760)

2026-04-25 00:36:34 +02:00 · 2026-02-17 03:09:28 -08:00 · 2026-02-17 03:09:28 -08:00 · 473996d35d
commit 473996d35d
parent c3591bcbf3
205 changed files with 304 additions and 5223 deletions
--- a/demos/samples_python/currency_exchange/README.md
+++ b/demos/samples_python/currency_exchange/README.md
--- a/demos/samples_python/currency_exchange/config.yaml
+++ b/demos/samples_python/currency_exchange/config.yaml
@ -1,13 +1,11 @@
-version: v0.1.0
+version: v0.3.0

 listeners:
-  ingress_traffic:
-    address: 0.0.0.0
+  - type: prompt
+    name: prompt_listener
    port: 10000
-    message_format: openai
-    timeout: 30s

-llm_providers:
+model_providers:
  - model: openai/gpt-4o-mini
    access_key: $OPENAI_API_KEY
    default: true
--- a/demos/advanced/currency_exchange/docker-compose.yaml
+++ b/demos/advanced/currency_exchange/docker-compose.yaml
@ -0,0 +1,25 @@
+services:
+  anythingllm:
+    image: mintplexlabs/anythingllm
+    restart: always
+    ports:
+      - "3001:3001"
+    cap_add:
+      - SYS_ADMIN
+    environment:
+      - STORAGE_DIR=/app/server/storage
+      - LLM_PROVIDER=generic-openai
+      - GENERIC_OPEN_AI_BASE_PATH=http://host.docker.internal:10000/v1
+      - GENERIC_OPEN_AI_MODEL_PREF=gpt-4o-mini
+      - GENERIC_OPEN_AI_MODEL_TOKEN_LIMIT=128000
+      - GENERIC_OPEN_AI_API_KEY=sk-placeholder
+    extra_hosts:
+      - "host.docker.internal:host-gateway"
+
+  jaeger:
+    build:
+      context: ../../shared/jaeger
+    ports:
+      - "16686:16686"
+      - "4317:4317"
+      - "4318:4318"
--- a/demos/samples_python/currency_exchange/hurl_tests/simple.hurl
+++ b/demos/samples_python/currency_exchange/hurl_tests/simple.hurl
--- a/demos/samples_python/currency_exchange/hurl_tests/simple_stream.hurl
+++ b/demos/samples_python/currency_exchange/hurl_tests/simple_stream.hurl
--- a/demos/samples_java/weather_forcecast_service/run_demo.sh
+++ b/demos/samples_java/weather_forcecast_service/run_demo.sh
--- a/demos/samples_python/currency_exchange/test_data.yaml
+++ b/demos/samples_python/currency_exchange/test_data.yaml
--- a/demos/use_cases/model_choice_with_test_harness/README.md
+++ b/demos/use_cases/model_choice_with_test_harness/README.md
--- a/demos/use_cases/model_choice_with_test_harness/bench.py
+++ b/demos/use_cases/model_choice_with_test_harness/bench.py
--- a/demos/use_cases/model_choice_with_test_harness/evals_summarize.yaml
+++ b/demos/use_cases/model_choice_with_test_harness/evals_summarize.yaml
--- a/demos/use_cases/model_choice_with_test_harness/plano_config_with_aliases.yaml
+++ b/demos/use_cases/model_choice_with_test_harness/plano_config_with_aliases.yaml
@ -1,13 +1,11 @@
-version: v0.1.0
+version: v0.3.0

 listeners:
-  egress_traffic:
-    address: 0.0.0.0
+  - type: model
+    name: model_listener
    port: 12000
-    message_format: openai
-    timeout: 30s

-llm_providers:
+model_providers:
  - model: openai/gpt-4o-mini
    access_key: $OPENAI_API_KEY
    default: true
@ -20,3 +18,6 @@ model_aliases:
    target: gpt-4o-mini
  arch.reason.v1:
    target: o3
+
+tracing:
+  random_sampling: 100
--- a/demos/use_cases/model_choice_with_test_harness/pyproject.toml
+++ b/demos/use_cases/model_choice_with_test_harness/pyproject.toml
--- a/demos/use_cases/model_choice_with_test_harness/run_demo.sh
+++ b/demos/use_cases/model_choice_with_test_harness/run_demo.sh
--- a/demos/use_cases/model_choice_with_test_harness/uv.lock
+++ b/demos/use_cases/model_choice_with_test_harness/uv.lock
--- a/demos/samples_python/multi_turn_rag_agent/Dockerfile
+++ b/demos/samples_python/multi_turn_rag_agent/Dockerfile
--- a/demos/samples_python/multi_turn_rag_agent/README.md
+++ b/demos/samples_python/multi_turn_rag_agent/README.md
--- a/demos/samples_python/multi_turn_rag_agent/config.yaml
+++ b/demos/samples_python/multi_turn_rag_agent/config.yaml
@ -1,18 +1,16 @@
-version: v0.1.0
+version: v0.3.0

 listeners:
-  ingress_traffic:
-    address: 0.0.0.0
+  - type: prompt
+    name: prompt_listener
    port: 10000
-    message_format: openai
-    timeout: 30s

 endpoints:
  rag_energy_source_agent:
    endpoint: host.docker.internal:18083
    connect_timeout: 0.005s

-llm_providers:
+model_providers:
  - access_key: $OPENAI_API_KEY
    model: openai/gpt-4o-mini
    default: true
--- a/demos/advanced/multi_turn_rag/docker-compose.yaml
+++ b/demos/advanced/multi_turn_rag/docker-compose.yaml
@ -0,0 +1,28 @@
+services:
+  rag_energy_source_agent:
+    build:
+      context: .
+      dockerfile: Dockerfile
+    ports:
+      - "18083:80"
+    healthcheck:
+        test: ["CMD", "curl" ,"http://localhost:80/healthz"]
+        interval: 5s
+        retries: 20
+
+  anythingllm:
+    image: mintplexlabs/anythingllm
+    restart: always
+    ports:
+      - "3001:3001"
+    cap_add:
+      - SYS_ADMIN
+    environment:
+      - STORAGE_DIR=/app/server/storage
+      - LLM_PROVIDER=generic-openai
+      - GENERIC_OPEN_AI_BASE_PATH=http://host.docker.internal:10000/v1
+      - GENERIC_OPEN_AI_MODEL_PREF=gpt-4o-mini
+      - GENERIC_OPEN_AI_MODEL_TOKEN_LIMIT=128000
+      - GENERIC_OPEN_AI_API_KEY=sk-placeholder
+    extra_hosts:
+      - "host.docker.internal:host-gateway"
--- a/demos/samples_python/multi_turn_rag_agent/main.py
+++ b/demos/samples_python/multi_turn_rag_agent/main.py
--- a/demos/samples_python/multi_turn_rag_agent/mutli-turn-example.png
+++ b/demos/samples_python/multi_turn_rag_agent/mutli-turn-example.png
--- a/demos/samples_python/multi_turn_rag_agent/requirements.txt
+++ b/demos/samples_python/multi_turn_rag_agent/requirements.txt
--- a/demos/samples_python/multi_turn_rag_agent/run_demo.sh
+++ b/demos/samples_python/multi_turn_rag_agent/run_demo.sh
--- a/demos/samples_python/stock_quote/README.md
+++ b/demos/samples_python/stock_quote/README.md
--- a/demos/samples_python/stock_quote/config.yaml
+++ b/demos/samples_python/stock_quote/config.yaml
@ -1,13 +1,11 @@
-version: v0.1.0
+version: v0.3.0

 listeners:
-  ingress_traffic:
-    address: 0.0.0.0
+  - type: prompt
+    name: prompt_listener
    port: 10000
-    message_format: openai
-    timeout: 30s

-llm_providers:
+model_providers:
  - access_key: $OPENAI_API_KEY
    model: openai/gpt-4o

--- a/demos/advanced/stock_quote/docker-compose.yaml
+++ b/demos/advanced/stock_quote/docker-compose.yaml
@ -0,0 +1,25 @@
+services:
+  anythingllm:
+    image: mintplexlabs/anythingllm
+    restart: always
+    ports:
+      - "3001:3001"
+    cap_add:
+      - SYS_ADMIN
+    environment:
+      - STORAGE_DIR=/app/server/storage
+      - LLM_PROVIDER=generic-openai
+      - GENERIC_OPEN_AI_BASE_PATH=http://host.docker.internal:10000/v1
+      - GENERIC_OPEN_AI_MODEL_PREF=gpt-4o-mini
+      - GENERIC_OPEN_AI_MODEL_TOKEN_LIMIT=128000
+      - GENERIC_OPEN_AI_API_KEY=sk-placeholder
+    extra_hosts:
+      - "host.docker.internal:host-gateway"
+
+  jaeger:
+    build:
+      context: ../../shared/jaeger
+    ports:
+      - "16686:16686"
+      - "4317:4317"
+      - "4318:4318"
--- a/demos/samples_python/currency_exchange/run_demo.sh
+++ b/demos/samples_python/currency_exchange/run_demo.sh
--- a/demos/samples_python/stock_quote/stock_quote_demo.png
+++ b/demos/samples_python/stock_quote/stock_quote_demo.png
--- a/demos/agent_orchestration/multi_agent_crewai_langchain/Dockerfile
+++ b/demos/agent_orchestration/multi_agent_crewai_langchain/Dockerfile
--- a/demos/agent_orchestration/multi_agent_crewai_langchain/README.md
+++ b/demos/agent_orchestration/multi_agent_crewai_langchain/README.md
@ -37,7 +37,7 @@ Plano acts as a **framework-agnostic proxy and data plane** that:

 ```bash
 # From the demo directory
-cd demos/use_cases/multi_agent_with_crewai_langchain
+cd demos/agent_orchestration/multi_agent_crewai_langchain

 # Build and start all services
 docker-compose up -d
--- a/demos/agent_orchestration/multi_agent_crewai_langchain/config.yaml
+++ b/demos/agent_orchestration/multi_agent_crewai_langchain/config.yaml
--- a/demos/agent_orchestration/multi_agent_crewai_langchain/crewai/flight_agent.py
+++ b/demos/agent_orchestration/multi_agent_crewai_langchain/crewai/flight_agent.py
--- a/demos/agent_orchestration/multi_agent_crewai_langchain/docker-compose.yaml
+++ b/demos/agent_orchestration/multi_agent_crewai_langchain/docker-compose.yaml
--- a/demos/agent_orchestration/multi_agent_crewai_langchain/langchain/weather_agent.py
+++ b/demos/agent_orchestration/multi_agent_crewai_langchain/langchain/weather_agent.py
--- a/demos/agent_orchestration/multi_agent_crewai_langchain/openai_protocol.py
+++ b/demos/agent_orchestration/multi_agent_crewai_langchain/openai_protocol.py
--- a/demos/agent_orchestration/multi_agent_crewai_langchain/pyproject.toml
+++ b/demos/agent_orchestration/multi_agent_crewai_langchain/pyproject.toml
--- a/demos/agent_orchestration/multi_agent_crewai_langchain/traces.png
+++ b/demos/agent_orchestration/multi_agent_crewai_langchain/traces.png
--- a/demos/agent_orchestration/multi_agent_crewai_langchain/uv.lock
+++ b/demos/agent_orchestration/multi_agent_crewai_langchain/uv.lock
--- a/demos/agent_orchestration/travel_agents/Dockerfile
+++ b/demos/agent_orchestration/travel_agents/Dockerfile
--- a/demos/agent_orchestration/travel_agents/README.md
+++ b/demos/agent_orchestration/travel_agents/README.md
--- a/demos/agent_orchestration/travel_agents/config.yaml
+++ b/demos/agent_orchestration/travel_agents/config.yaml
--- a/demos/agent_orchestration/travel_agents/docker-compose.yaml
+++ b/demos/agent_orchestration/travel_agents/docker-compose.yaml
--- a/demos/agent_orchestration/travel_agents/pyproject.toml
+++ b/demos/agent_orchestration/travel_agents/pyproject.toml
--- a/demos/agent_orchestration/travel_agents/src/travel_agents/flight_agent.py
+++ b/demos/agent_orchestration/travel_agents/src/travel_agents/flight_agent.py
--- a/demos/agent_orchestration/travel_agents/src/travel_agents/weather_agent.py
+++ b/demos/agent_orchestration/travel_agents/src/travel_agents/weather_agent.py
--- a/demos/agent_orchestration/travel_agents/test.rest
+++ b/demos/agent_orchestration/travel_agents/test.rest
--- a/demos/agent_orchestration/travel_agents/tracing.png
+++ b/demos/agent_orchestration/travel_agents/tracing.png
--- a/demos/agent_orchestration/travel_agents/travel_agent_request.rest
+++ b/demos/agent_orchestration/travel_agents/travel_agent_request.rest
--- a/demos/agent_orchestration/travel_agents/uv.lock
+++ b/demos/agent_orchestration/travel_agents/uv.lock
--- a/demos/filter_chains/http_filter/Dockerfile
+++ b/demos/filter_chains/http_filter/Dockerfile
--- a/demos/filter_chains/http_filter/README.md
+++ b/demos/filter_chains/http_filter/README.md
--- a/demos/filter_chains/http_filter/config.yaml
+++ b/demos/filter_chains/http_filter/config.yaml
--- a/demos/filter_chains/http_filter/docker-compose.yaml
+++ b/demos/filter_chains/http_filter/docker-compose.yaml
--- a/demos/filter_chains/http_filter/http.rest
+++ b/demos/filter_chains/http_filter/http.rest
--- a/demos/filter_chains/http_filter/mcp_query.rest
+++ b/demos/filter_chains/http_filter/mcp_query.rest
--- a/demos/filter_chains/http_filter/pyproject.toml
+++ b/demos/filter_chains/http_filter/pyproject.toml
--- a/demos/filter_chains/http_filter/sample_queries.md
+++ b/demos/filter_chains/http_filter/sample_queries.md
--- a/demos/filter_chains/http_filter/src/rag_agent/init.py
+++ b/demos/filter_chains/http_filter/src/rag_agent/init.py
--- a/demos/filter_chains/http_filter/src/rag_agent/main.py
+++ b/demos/filter_chains/http_filter/src/rag_agent/main.py
--- a/demos/filter_chains/http_filter/src/rag_agent/api.py
+++ b/demos/filter_chains/http_filter/src/rag_agent/api.py
--- a/demos/filter_chains/http_filter/src/rag_agent/context_builder.py
+++ b/demos/filter_chains/http_filter/src/rag_agent/context_builder.py
--- a/demos/filter_chains/http_filter/src/rag_agent/input_guards.py
+++ b/demos/filter_chains/http_filter/src/rag_agent/input_guards.py
--- a/demos/filter_chains/http_filter/src/rag_agent/query_rewriter.py
+++ b/demos/filter_chains/http_filter/src/rag_agent/query_rewriter.py
--- a/demos/filter_chains/http_filter/src/rag_agent/rag_agent.py
+++ b/demos/filter_chains/http_filter/src/rag_agent/rag_agent.py
--- a/demos/filter_chains/http_filter/src/rag_agent/sample_knowledge_base.csv
+++ b/demos/filter_chains/http_filter/src/rag_agent/sample_knowledge_base.csv
--- a/demos/filter_chains/http_filter/start_agents.sh
+++ b/demos/filter_chains/http_filter/start_agents.sh
--- a/demos/filter_chains/http_filter/test.rest
+++ b/demos/filter_chains/http_filter/test.rest
--- a/demos/filter_chains/http_filter/uv.lock
+++ b/demos/filter_chains/http_filter/uv.lock
--- a/demos/filter_chains/mcp_filter/Dockerfile
+++ b/demos/filter_chains/mcp_filter/Dockerfile
--- a/demos/filter_chains/mcp_filter/README.md
+++ b/demos/filter_chains/mcp_filter/README.md
--- a/demos/filter_chains/mcp_filter/config.yaml
+++ b/demos/filter_chains/mcp_filter/config.yaml
--- a/demos/filter_chains/mcp_filter/docker-compose.yaml
+++ b/demos/filter_chains/mcp_filter/docker-compose.yaml
--- a/demos/filter_chains/mcp_filter/mcp_query.rest
+++ b/demos/filter_chains/mcp_filter/mcp_query.rest
--- a/demos/filter_chains/mcp_filter/pyproject.toml
+++ b/demos/filter_chains/mcp_filter/pyproject.toml
--- a/demos/filter_chains/mcp_filter/sample_queries.md
+++ b/demos/filter_chains/mcp_filter/sample_queries.md
--- a/demos/filter_chains/mcp_filter/src/rag_agent/init.py
+++ b/demos/filter_chains/mcp_filter/src/rag_agent/init.py
--- a/demos/filter_chains/mcp_filter/src/rag_agent/main.py
+++ b/demos/filter_chains/mcp_filter/src/rag_agent/main.py
--- a/demos/filter_chains/mcp_filter/src/rag_agent/api.py
+++ b/demos/filter_chains/mcp_filter/src/rag_agent/api.py
--- a/demos/filter_chains/mcp_filter/src/rag_agent/context_builder.py
+++ b/demos/filter_chains/mcp_filter/src/rag_agent/context_builder.py
--- a/demos/filter_chains/mcp_filter/src/rag_agent/input_guards.py
+++ b/demos/filter_chains/mcp_filter/src/rag_agent/input_guards.py
--- a/demos/filter_chains/mcp_filter/src/rag_agent/query_rewriter.py
+++ b/demos/filter_chains/mcp_filter/src/rag_agent/query_rewriter.py
--- a/demos/filter_chains/mcp_filter/src/rag_agent/rag_agent.py
+++ b/demos/filter_chains/mcp_filter/src/rag_agent/rag_agent.py
--- a/demos/filter_chains/mcp_filter/src/rag_agent/sample_knowledge_base.csv
+++ b/demos/filter_chains/mcp_filter/src/rag_agent/sample_knowledge_base.csv
--- a/demos/filter_chains/mcp_filter/start_agents.sh
+++ b/demos/filter_chains/mcp_filter/start_agents.sh
--- a/demos/filter_chains/mcp_filter/test.rest
+++ b/demos/filter_chains/mcp_filter/test.rest
--- a/demos/filter_chains/mcp_filter/uv.lock
+++ b/demos/filter_chains/mcp_filter/uv.lock
--- a/demos/getting_started/llm_gateway/README.md
+++ b/demos/getting_started/llm_gateway/README.md
@ -7,7 +7,7 @@ This demo shows how you can use Plano gateway to manage keys and route to upstre
   ```sh
   sh run_demo.sh
   ```
-1. Navigate to http://localhost:18080/
+1. Navigate to http://localhost:3001/

 The following screenshot shows an example interaction with the Plano gateway demonstrating dynamic routing. You can select between different LLMs using the "override model" option in the chat UI.

@ -32,7 +32,7 @@ $ curl --header 'Content-Type: application/json' \
      "messages": {
        "role": "assistant",
        "tool_calls": null,
-        "content": "Hello! How can I assist you today? Let's chat about anything you'd like. 😊"
+        "content": "Hello! How can I assist you today? Let's chat about anything you'd like."
      },
      "finish_reason": "stop"
    }
@ -47,11 +47,7 @@ $ curl --header 'Content-Type: application/json' \
 ```

 # Observability
-Plano gateway publishes stats endpoint at http://localhost:19901/stats. In this demo we are using prometheus to pull stats from Plano and we are using grafana to visualize the stats in dashboard. To see grafana dashboard follow instructions below,
-
-1. Navigate to http://localhost:3000/ to open grafana UI (use admin/grafana as credentials)
-1. From grafana left nav click on dashboards and select "Intelligent Gateway Overview" to view Plano gateway stats
-1. For tracing you can head over to http://localhost:16686/ to view recent traces.
+For tracing you can head over to http://localhost:16686/ to view recent traces.

 The following screenshot of the tracing UI shows a call received by the Plano gateway and the upstream call it makes to the LLM:

--- a/demos/getting_started/llm_gateway/config.yaml
+++ b/demos/getting_started/llm_gateway/config.yaml
--- a/demos/getting_started/llm_gateway/docker-compose.yaml
+++ b/demos/getting_started/llm_gateway/docker-compose.yaml
@ -37,13 +37,3 @@ services:
      - "16686:16686"
      - "4317:4317"
      - "4318:4318"
-
-  prometheus:
-    build:
-      context: ../../shared/prometheus
-
-  grafana:
-    build:
-      context: ../../shared/grafana
-    ports:
-      - "3000:3000"
--- a/demos/getting_started/llm_gateway/jaeger_tracing_llm_routing.png
+++ b/demos/getting_started/llm_gateway/jaeger_tracing_llm_routing.png
--- a/demos/getting_started/llm_gateway/llm_routing_demo.png
+++ b/demos/getting_started/llm_gateway/llm_routing_demo.png
--- a/demos/getting_started/llm_gateway/run_demo.sh
+++ b/demos/getting_started/llm_gateway/run_demo.sh
--- a/demos/getting_started/weather_forecast/Dockerfile
+++ b/demos/getting_started/weather_forecast/Dockerfile
--- a/demos/getting_started/weather_forecast/README.md
+++ b/demos/getting_started/weather_forecast/README.md
@ -0,0 +1,28 @@
+# Function calling
+
+This demo shows how you can use Plano's core function calling capabilities.
+
+# Starting the demo
+
+1. Please make sure the [pre-requisites](https://github.com/katanemo/arch/?tab=readme-ov-file#prerequisites) are installed correctly
+2. Start Plano
+
+   ```sh
+   sh run_demo.sh
+   ```
+3. Navigate to http://localhost:3001/
+4. You can type in queries like "how is the weather?"
+
+Here is a sample interaction:
+<img width="575" alt="image" src="https://github.com/user-attachments/assets/e0929490-3eb2-4130-ae87-a732aea4d059">
+
+## Tracing
+
+To see a tracing dashboard, navigate to http://localhost:16686/ to open Jaeger UI.
+
+## Stopping the demo
+
+1. To end the demo, run the following command:
+   ```sh
+   sh run_demo.sh down
+   ```
--- a/demos/getting_started/weather_forecast/config.yaml
+++ b/demos/getting_started/weather_forecast/config.yaml
@ -1,17 +1,13 @@
-version: v0.1.0
+version: v0.3.0

 listeners:
-  ingress_traffic:
-    address: 0.0.0.0
+  - type: prompt
+    name: prompt_listener
    port: 10000
-    message_format: openai
-    timeout: 30s

-  egress_traffic:
-    address: 0.0.0.0
+  - type: model
+    name: model_listener
    port: 12000
-    message_format: openai
-    timeout: 30s

 endpoints:
  weather_forecast_service:
@ -22,7 +18,7 @@ overrides:
  # confidence threshold for prompt target intent matching
  prompt_target_intent_matching_threshold: 0.6

-llm_providers:
+model_providers:
  - access_key: $GROQ_API_KEY
    model: groq/llama-3.2-3b-preview

--- a/demos/getting_started/weather_forecast/docker-compose.yaml
+++ b/demos/getting_started/weather_forecast/docker-compose.yaml
@ -0,0 +1,27 @@
+services:
+  weather_forecast_service:
+    build:
+      context: ./
+    environment:
+      - OLTP_HOST=http://jaeger:4317
+    extra_hosts:
+      - "host.docker.internal:host-gateway"
+    ports:
+      - "18083:80"
+
+  anythingllm:
+    image: mintplexlabs/anythingllm
+    restart: always
+    ports:
+      - "3001:3001"
+    cap_add:
+      - SYS_ADMIN
+    environment:
+      - STORAGE_DIR=/app/server/storage
+      - LLM_PROVIDER=generic-openai
+      - GENERIC_OPEN_AI_BASE_PATH=http://host.docker.internal:10000/v1
+      - GENERIC_OPEN_AI_MODEL_PREF=gpt-4o-mini
+      - GENERIC_OPEN_AI_MODEL_TOKEN_LIMIT=128000
+      - GENERIC_OPEN_AI_API_KEY=sk-placeholder
+    extra_hosts:
+      - "host.docker.internal:host-gateway"
--- a/demos/getting_started/weather_forecast/hurl_tests/simple.hurl
+++ b/demos/getting_started/weather_forecast/hurl_tests/simple.hurl
--- a/demos/getting_started/weather_forecast/hurl_tests/simple_stream.hurl
+++ b/demos/getting_started/weather_forecast/hurl_tests/simple_stream.hurl
--- a/demos/getting_started/weather_forecast/main.py
+++ b/demos/getting_started/weather_forecast/main.py
--- a/demos/getting_started/weather_forecast/pyproject.toml
+++ b/demos/getting_started/weather_forecast/pyproject.toml
--- a/demos/getting_started/weather_forecast/run_demo.sh
+++ b/demos/getting_started/weather_forecast/run_demo.sh
--- a/Show more
+++ b/Show more