From a0d132f5b6f16827c9a525696fd53589e8e02e5b Mon Sep 17 00:00:00 2001 From: Adil Hafeez Date: Mon, 16 Sep 2024 19:21:59 -0700 Subject: [PATCH] remove unused demos --- demos/weather-forecast-local-llm/README.md | 22 -- .../docker-compose.yaml | 89 ----- .../download_mistral_7b.sh | 1 - .../grafana/dashboard.yaml | 12 - .../grafana/dashboards/envoy_overview.json | 355 ------------------ .../grafana/datasource.yaml | 9 - .../katanemo-config.yaml | 46 --- .../prometheus/prometheus.yaml | 23 -- demos/weather-forecast/README.md | 19 - demos/weather-forecast/docker-compose.yaml | 80 ---- demos/weather-forecast/grafana/dashboard.yaml | 12 - .../grafana/dashboards/envoy_overview.json | 355 ------------------ .../weather-forecast/grafana/datasource.yaml | 9 - demos/weather-forecast/katanemo-config.yaml | 42 --- .../prometheus/prometheus.yaml | 23 -- 15 files changed, 1097 deletions(-) delete mode 100644 demos/weather-forecast-local-llm/README.md delete mode 100644 demos/weather-forecast-local-llm/docker-compose.yaml delete mode 100644 demos/weather-forecast-local-llm/download_mistral_7b.sh delete mode 100644 demos/weather-forecast-local-llm/grafana/dashboard.yaml delete mode 100644 demos/weather-forecast-local-llm/grafana/dashboards/envoy_overview.json delete mode 100644 demos/weather-forecast-local-llm/grafana/datasource.yaml delete mode 100644 demos/weather-forecast-local-llm/katanemo-config.yaml delete mode 100644 demos/weather-forecast-local-llm/prometheus/prometheus.yaml delete mode 100644 demos/weather-forecast/README.md delete mode 100644 demos/weather-forecast/docker-compose.yaml delete mode 100644 demos/weather-forecast/grafana/dashboard.yaml delete mode 100644 demos/weather-forecast/grafana/dashboards/envoy_overview.json delete mode 100644 demos/weather-forecast/grafana/datasource.yaml delete mode 100644 demos/weather-forecast/katanemo-config.yaml delete mode 100644 demos/weather-forecast/prometheus/prometheus.yaml diff --git a/demos/weather-forecast-local-llm/README.md b/demos/weather-forecast-local-llm/README.md deleted file mode 100644 index 885ace4a..00000000 --- a/demos/weather-forecast-local-llm/README.md +++ /dev/null @@ -1,22 +0,0 @@ -# Weather forecasting -This demo shows how you can use intelligent prompt gateway to provide realtime weather forecast using Mistral LLM locally hosted using llama.cpp as LLM Hosting Service. - -# Startig the demo -1. Ensure that submodule is up to date - ```sh - git submodule sync --recursive - ``` -1. Download mistral 7b model using following shell command - ```sh - sh download_mistral_7b.sh - ``` -2. Start services - ```sh - docker compose up - ``` -3. Navigate to http://localhost:18080/ -4. You can type in queries like "how is the weather in Seattle" - 1. You can also ask follow up questions like "show me sunny days" -5. To see metrics navigate to "http://localhost:3000/" (use admin/grafana for login) - 1. Open up dahsboard named "Intelligent Gateway Overview" - 2. On this dashboard you can see reuqest latency and number of requests diff --git a/demos/weather-forecast-local-llm/docker-compose.yaml b/demos/weather-forecast-local-llm/docker-compose.yaml deleted file mode 100644 index 369511df..00000000 --- a/demos/weather-forecast-local-llm/docker-compose.yaml +++ /dev/null @@ -1,89 +0,0 @@ -services: - config-generator: - build: - context: ../../ - dockerfile: config_generator/Dockerfile - volumes: - - ../../envoyfilter/envoy.template.yaml:/usr/src/app/envoy.template.yaml - - ./katanemo-config.yaml:/usr/src/app/katanemo-config.yaml - - ./generated:/usr/src/app/out - envoy: - build: - context: ../../ - dockerfile: envoyfilter/Dockerfile - hostname: envoy - ports: - - "10000:10000" - - "19901:9901" - volumes: - - ./generated/envoy.yaml:/etc/envoy/envoy.yaml - - /etc/ssl/cert.pem:/etc/ssl/cert.pem - depends_on: - config-generator: - condition: service_completed_successfully - embeddingserver: - condition: service_healthy - - embeddingserver: - build: - context: ../../embedding-server - dockerfile: Dockerfile - ports: - - "18081:80" - healthcheck: - test: ["CMD", "curl" ,"http://localhost:80/healthz"] - interval: 5s - retries: 20 - volumes: - - ~/.cache/huggingface:/root/.cache/huggingface - qdrant: - image: qdrant/qdrant - hostname: vector-db - ports: - - 16333:6333 - - 16334:6334 - - chatbot-ui: - build: - context: ../../chatbot-ui - dockerfile: Dockerfile - ports: - - "18080:8080" - environment: - - OPENAI_API_KEY=${OPENAI_API_KEY} - - CHAT_COMPLETION_ENDPOINT=http://envoy:10000/v1/chat/completions - - prometheus: - image: prom/prometheus - container_name: prometheus - command: - - '--config.file=/etc/prometheus/prometheus.yaml' - ports: - - 9090:9090 - restart: unless-stopped - volumes: - - ./prometheus:/etc/prometheus - - ./prom_data:/prometheus - - grafana: - image: grafana/grafana - container_name: grafana - ports: - - 3000:3000 - restart: unless-stopped - environment: - - GF_SECURITY_ADMIN_USER=admin - - GF_SECURITY_ADMIN_PASSWORD=grafana - volumes: - - ./grafana:/etc/grafana/provisioning/datasources - - ./grafana/dashboard.yaml:/etc/grafana/provisioning/dashboards/main.yaml - - ./grafana/dashboards:/var/lib/grafana/dashboards - - mistral_7b_instruct: - image: ghcr.io/ggerganov/llama.cpp:server - hostname: mistral_7b_instruct - ports: - - "10001:10001" - volumes: - - ./mistral-7b-instruct-v0.2.Q4_K_M.gguf:/models/model.gguf - command: ["--host", "0.0.0.0", "--port", "10001", "-m", "/models/model.gguf"] diff --git a/demos/weather-forecast-local-llm/download_mistral_7b.sh b/demos/weather-forecast-local-llm/download_mistral_7b.sh deleted file mode 100644 index f3b682ec..00000000 --- a/demos/weather-forecast-local-llm/download_mistral_7b.sh +++ /dev/null @@ -1 +0,0 @@ -huggingface-cli download TheBloke/Mistral-7B-Instruct-v0.2-GGUF mistral-7b-instruct-v0.2.Q4_K_M.gguf --local-dir . --local-dir-use-symlinks False diff --git a/demos/weather-forecast-local-llm/grafana/dashboard.yaml b/demos/weather-forecast-local-llm/grafana/dashboard.yaml deleted file mode 100644 index fd66a479..00000000 --- a/demos/weather-forecast-local-llm/grafana/dashboard.yaml +++ /dev/null @@ -1,12 +0,0 @@ -apiVersion: 1 - -providers: - - name: "Dashboard provider" - orgId: 1 - type: file - disableDeletion: false - updateIntervalSeconds: 10 - allowUiUpdates: false - options: - path: /var/lib/grafana/dashboards - foldersFromFilesStructure: true diff --git a/demos/weather-forecast-local-llm/grafana/dashboards/envoy_overview.json b/demos/weather-forecast-local-llm/grafana/dashboards/envoy_overview.json deleted file mode 100644 index 51bff777..00000000 --- a/demos/weather-forecast-local-llm/grafana/dashboards/envoy_overview.json +++ /dev/null @@ -1,355 +0,0 @@ -{ - "annotations": { - "list": [ - { - "builtIn": 1, - "datasource": { - "type": "grafana", - "uid": "-- Grafana --" - }, - "enable": true, - "hide": true, - "iconColor": "rgba(0, 211, 255, 1)", - "name": "Annotations & Alerts", - "type": "dashboard" - } - ] - }, - "editable": true, - "fiscalYearStartMonth": 0, - "graphTooltip": 1, - "links": [], - "panels": [ - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "auto", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green", - "value": null - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [] - }, - "gridPos": { - "h": 8, - "w": 12, - "x": 0, - "y": 0 - }, - "id": 2, - "options": { - "legend": { - "calcs": [], - "displayMode": "list", - "placement": "bottom", - "showLegend": true - }, - "tooltip": { - "mode": "single", - "sort": "none" - } - }, - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "disableTextWrap": false, - "editorMode": "code", - "expr": "avg(rate(envoy_cluster_internal_upstream_rq_time_sum[1m]) / rate(envoy_cluster_internal_upstream_rq_time_count[1m])) by (envoy_cluster_name)", - "fullMetaSearch": false, - "hide": false, - "includeNullMetadata": true, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A", - "useBackend": false - } - ], - "title": "request latency - internal (ms)", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "auto", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green", - "value": null - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [] - }, - "gridPos": { - "h": 8, - "w": 12, - "x": 12, - "y": 0 - }, - "id": 1, - "options": { - "legend": { - "calcs": [], - "displayMode": "list", - "placement": "bottom", - "showLegend": true - }, - "tooltip": { - "mode": "single", - "sort": "none" - } - }, - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "disableTextWrap": false, - "editorMode": "code", - "expr": "avg(rate(envoy_cluster_external_upstream_rq_time_sum[1m]) / rate(envoy_cluster_external_upstream_rq_time_count[1m])) by (envoy_cluster_name)", - "fullMetaSearch": false, - "hide": false, - "includeNullMetadata": true, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A", - "useBackend": false - } - ], - "title": "request latency - external (ms)", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "auto", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green", - "value": null - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [] - }, - "gridPos": { - "h": 8, - "w": 12, - "x": 0, - "y": 8 - }, - "id": 3, - "options": { - "legend": { - "calcs": [], - "displayMode": "list", - "placement": "bottom", - "showLegend": true - }, - "tooltip": { - "mode": "single", - "sort": "none" - } - }, - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "disableTextWrap": false, - "editorMode": "code", - "expr": "avg(rate(envoy_cluster_internal_upstream_rq_completed[1m])) by (envoy_cluster_name)", - "fullMetaSearch": false, - "includeNullMetadata": true, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A", - "useBackend": false - }, - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "disableTextWrap": false, - "editorMode": "code", - "expr": "avg(rate(envoy_cluster_external_upstream_rq_completed[1m])) by (envoy_cluster_name)", - "fullMetaSearch": false, - "hide": false, - "includeNullMetadata": true, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "B", - "useBackend": false - } - ], - "title": "Upstream request count", - "type": "timeseries" - } - ], - "schemaVersion": 39, - "tags": [], - "templating": { - "list": [] - }, - "time": { - "from": "now-15m", - "to": "now" - }, - "timepicker": {}, - "timezone": "browser", - "title": "Intelligent Gateway Overview", - "uid": "adt6uhx5lk8aob", - "version": 3, - "weekStart": "" -} diff --git a/demos/weather-forecast-local-llm/grafana/datasource.yaml b/demos/weather-forecast-local-llm/grafana/datasource.yaml deleted file mode 100644 index 4870174e..00000000 --- a/demos/weather-forecast-local-llm/grafana/datasource.yaml +++ /dev/null @@ -1,9 +0,0 @@ -apiVersion: 1 - -datasources: -- name: Prometheus - type: prometheus - url: http://prometheus:9090 - isDefault: true - access: proxy - editable: true diff --git a/demos/weather-forecast-local-llm/katanemo-config.yaml b/demos/weather-forecast-local-llm/katanemo-config.yaml deleted file mode 100644 index de772cce..00000000 --- a/demos/weather-forecast-local-llm/katanemo-config.yaml +++ /dev/null @@ -1,46 +0,0 @@ -default_prompt_endpoint: "127.0.0.1" -load_balancing: "round_robin" -timeout_ms: 5000 - -embedding_provider: - name: "SentenceTransformer" - model: "all-MiniLM-L6-v2" - -llm_providers: - - - name: open-ai-gpt-4 - api_key: "$OPEN_AI_API_KEY" - model: gpt-4 - - - name: mistral_7b_instruct - model: mistral-7b-instruct - endpoint: http://mistral_7b_instruct:10001/v1/chat/completions - default: true - -prompt_targets: - - - type: context_resolver - name: weather_forecast - few_shot_examples: - - what is the weather in New York? - - how is the weather in San Francisco? - - what is the forecast in Chicago? - entities: - - name: city - required: true - - name: days - endpoint: - cluster: weatherhost - path: /weather - system_prompt: | - You are a helpful weather forecaster. Use weater data that is provided to you. Please following following guidelines when responding to user queries: - - Use farenheight for temperature - - Use miles per hour for wind speed - -#TODO: add support for adding custom clusters e.g. - # clusters: - # qdrant: - # options: - # - address: "qdrant" - # - address: "weatherhost" - # - port: 6333 diff --git a/demos/weather-forecast-local-llm/prometheus/prometheus.yaml b/demos/weather-forecast-local-llm/prometheus/prometheus.yaml deleted file mode 100644 index 5aa25e0d..00000000 --- a/demos/weather-forecast-local-llm/prometheus/prometheus.yaml +++ /dev/null @@ -1,23 +0,0 @@ -global: - scrape_interval: 15s - scrape_timeout: 10s - evaluation_interval: 15s -alerting: - alertmanagers: - - static_configs: - - targets: [] - scheme: http - timeout: 10s - api_version: v1 -scrape_configs: -- job_name: envoy - honor_timestamps: true - scrape_interval: 15s - scrape_timeout: 10s - metrics_path: /stats - scheme: http - static_configs: - - targets: - - envoy:9901 - params: - format: ['prometheus'] diff --git a/demos/weather-forecast/README.md b/demos/weather-forecast/README.md deleted file mode 100644 index dec35d4b..00000000 --- a/demos/weather-forecast/README.md +++ /dev/null @@ -1,19 +0,0 @@ -# Weather forecasting -This demo shows how you can use intelligent prompt gateway to provide realtime weather forecast. - -# Startig the demo -1. Ensure that submodule is up to date - ```sh - git submodule sync --recursive - ``` -1. Create `.env` file and set OpenAI key using env var `OPENAI_API_KEY` -1. Start services - ```sh - docker compose up - ``` -1. Navigate to http://localhost:18080/ -1. You can type in queries like "how is the weather in Seattle" - 1. You can also ask follow up questions like "show me sunny days" -1. To see metrics navigate to "http://localhost:3000/" (use admin/grafana for login) - 1. Open up dahsboard named "Intelligent Gateway Overview" - 2. On this dashboard you can see reuqest latency and number of requests diff --git a/demos/weather-forecast/docker-compose.yaml b/demos/weather-forecast/docker-compose.yaml deleted file mode 100644 index 28480588..00000000 --- a/demos/weather-forecast/docker-compose.yaml +++ /dev/null @@ -1,80 +0,0 @@ -services: - config-generator: - build: - context: ../../ - dockerfile: config_generator/Dockerfile - volumes: - - ../../envoyfilter/envoy.template.yaml:/usr/src/app/envoy.template.yaml - - ./katanemo-config.yaml:/usr/src/app/katanemo-config.yaml - - ./generated:/usr/src/app/out - envoy: - build: - context: ../../ - dockerfile: envoyfilter/Dockerfile - hostname: envoy - ports: - - "10000:10000" - - "19901:9901" - volumes: - - ./generated/envoy.yaml:/etc/envoy/envoy.yaml - - /etc/ssl/cert.pem:/etc/ssl/cert.pem - depends_on: - config-generator: - condition: service_completed_successfully - embeddingserver: - condition: service_healthy - - embeddingserver: - build: - context: ../../embedding-server - dockerfile: Dockerfile - ports: - - "18081:80" - healthcheck: - test: ["CMD", "curl" ,"http://localhost:80/healthz"] - interval: 5s - retries: 20 - volumes: - - ~/.cache/huggingface:/root/.cache/huggingface - qdrant: - image: qdrant/qdrant - hostname: vector-db - ports: - - 16333:6333 - - 16334:6334 - - chatbot-ui: - build: - context: ../../chatbot-ui - dockerfile: Dockerfile - ports: - - "18080:8080" - environment: - - OPENAI_API_KEY=${OPENAI_API_KEY} - - CHAT_COMPLETION_ENDPOINT=http://envoy:10000/v1/chat/completions - - prometheus: - image: prom/prometheus - container_name: prometheus - command: - - '--config.file=/etc/prometheus/prometheus.yaml' - ports: - - 9090:9090 - restart: unless-stopped - volumes: - - ./prometheus:/etc/prometheus - - ./prom_data:/prometheus - - grafana: - image: grafana/grafana - container_name: grafana - ports: - - 3000:3000 - restart: unless-stopped - environment: - - GF_SECURITY_ADMIN_USER=admin - - GF_SECURITY_ADMIN_PASSWORD=grafana - volumes: - - ./grafana:/etc/grafana/provisioning/datasources - - ./grafana/dashboard.yaml:/etc/grafana/provisioning/dashboards/main.yaml - - ./grafana/dashboards:/var/lib/grafana/dashboards diff --git a/demos/weather-forecast/grafana/dashboard.yaml b/demos/weather-forecast/grafana/dashboard.yaml deleted file mode 100644 index fd66a479..00000000 --- a/demos/weather-forecast/grafana/dashboard.yaml +++ /dev/null @@ -1,12 +0,0 @@ -apiVersion: 1 - -providers: - - name: "Dashboard provider" - orgId: 1 - type: file - disableDeletion: false - updateIntervalSeconds: 10 - allowUiUpdates: false - options: - path: /var/lib/grafana/dashboards - foldersFromFilesStructure: true diff --git a/demos/weather-forecast/grafana/dashboards/envoy_overview.json b/demos/weather-forecast/grafana/dashboards/envoy_overview.json deleted file mode 100644 index 51bff777..00000000 --- a/demos/weather-forecast/grafana/dashboards/envoy_overview.json +++ /dev/null @@ -1,355 +0,0 @@ -{ - "annotations": { - "list": [ - { - "builtIn": 1, - "datasource": { - "type": "grafana", - "uid": "-- Grafana --" - }, - "enable": true, - "hide": true, - "iconColor": "rgba(0, 211, 255, 1)", - "name": "Annotations & Alerts", - "type": "dashboard" - } - ] - }, - "editable": true, - "fiscalYearStartMonth": 0, - "graphTooltip": 1, - "links": [], - "panels": [ - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "auto", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green", - "value": null - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [] - }, - "gridPos": { - "h": 8, - "w": 12, - "x": 0, - "y": 0 - }, - "id": 2, - "options": { - "legend": { - "calcs": [], - "displayMode": "list", - "placement": "bottom", - "showLegend": true - }, - "tooltip": { - "mode": "single", - "sort": "none" - } - }, - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "disableTextWrap": false, - "editorMode": "code", - "expr": "avg(rate(envoy_cluster_internal_upstream_rq_time_sum[1m]) / rate(envoy_cluster_internal_upstream_rq_time_count[1m])) by (envoy_cluster_name)", - "fullMetaSearch": false, - "hide": false, - "includeNullMetadata": true, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A", - "useBackend": false - } - ], - "title": "request latency - internal (ms)", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "auto", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green", - "value": null - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [] - }, - "gridPos": { - "h": 8, - "w": 12, - "x": 12, - "y": 0 - }, - "id": 1, - "options": { - "legend": { - "calcs": [], - "displayMode": "list", - "placement": "bottom", - "showLegend": true - }, - "tooltip": { - "mode": "single", - "sort": "none" - } - }, - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "disableTextWrap": false, - "editorMode": "code", - "expr": "avg(rate(envoy_cluster_external_upstream_rq_time_sum[1m]) / rate(envoy_cluster_external_upstream_rq_time_count[1m])) by (envoy_cluster_name)", - "fullMetaSearch": false, - "hide": false, - "includeNullMetadata": true, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A", - "useBackend": false - } - ], - "title": "request latency - external (ms)", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "auto", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green", - "value": null - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [] - }, - "gridPos": { - "h": 8, - "w": 12, - "x": 0, - "y": 8 - }, - "id": 3, - "options": { - "legend": { - "calcs": [], - "displayMode": "list", - "placement": "bottom", - "showLegend": true - }, - "tooltip": { - "mode": "single", - "sort": "none" - } - }, - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "disableTextWrap": false, - "editorMode": "code", - "expr": "avg(rate(envoy_cluster_internal_upstream_rq_completed[1m])) by (envoy_cluster_name)", - "fullMetaSearch": false, - "includeNullMetadata": true, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A", - "useBackend": false - }, - { - "datasource": { - "type": "prometheus", - "uid": "PBFA97CFB590B2093" - }, - "disableTextWrap": false, - "editorMode": "code", - "expr": "avg(rate(envoy_cluster_external_upstream_rq_completed[1m])) by (envoy_cluster_name)", - "fullMetaSearch": false, - "hide": false, - "includeNullMetadata": true, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "B", - "useBackend": false - } - ], - "title": "Upstream request count", - "type": "timeseries" - } - ], - "schemaVersion": 39, - "tags": [], - "templating": { - "list": [] - }, - "time": { - "from": "now-15m", - "to": "now" - }, - "timepicker": {}, - "timezone": "browser", - "title": "Intelligent Gateway Overview", - "uid": "adt6uhx5lk8aob", - "version": 3, - "weekStart": "" -} diff --git a/demos/weather-forecast/grafana/datasource.yaml b/demos/weather-forecast/grafana/datasource.yaml deleted file mode 100644 index 4870174e..00000000 --- a/demos/weather-forecast/grafana/datasource.yaml +++ /dev/null @@ -1,9 +0,0 @@ -apiVersion: 1 - -datasources: -- name: Prometheus - type: prometheus - url: http://prometheus:9090 - isDefault: true - access: proxy - editable: true diff --git a/demos/weather-forecast/katanemo-config.yaml b/demos/weather-forecast/katanemo-config.yaml deleted file mode 100644 index 293d57a0..00000000 --- a/demos/weather-forecast/katanemo-config.yaml +++ /dev/null @@ -1,42 +0,0 @@ -default_prompt_endpoint: "127.0.0.1" -load_balancing: "round_robin" -timeout_ms: 5000 - -embedding_provider: - name: "SentenceTransformer" - model: "all-MiniLM-L6-v2" - -llm_providers: - - - name: open-ai-gpt-4 - api_key: $OPEN_AI_API_KEY - model: gpt-4 - default: true - -prompt_targets: - - - type: context_resolver - name: weather_forecast - few_shot_examples: - - what is the weather in New York? - - how is the weather in San Francisco? - - what is the forecast in Chicago? - entities: - - name: city - required: true - - name: days - endpoint: - cluster: weatherhost - path: /weather - system_prompt: | - You are a helpful weather forecaster. Use weater data that is provided to you. Please following following guidelines when responding to user queries: - - Use farenheight for temperature - - Use miles per hour for wind speed - -#TODO: add support for adding custom clusters e.g. - # clusters: - # qdrant: - # options: - # - address: "qdrant" - # - address: "weatherhost" - # - port: 6333 diff --git a/demos/weather-forecast/prometheus/prometheus.yaml b/demos/weather-forecast/prometheus/prometheus.yaml deleted file mode 100644 index 5aa25e0d..00000000 --- a/demos/weather-forecast/prometheus/prometheus.yaml +++ /dev/null @@ -1,23 +0,0 @@ -global: - scrape_interval: 15s - scrape_timeout: 10s - evaluation_interval: 15s -alerting: - alertmanagers: - - static_configs: - - targets: [] - scheme: http - timeout: 10s - api_version: v1 -scrape_configs: -- job_name: envoy - honor_timestamps: true - scrape_interval: 15s - scrape_timeout: 10s - metrics_path: /stats - scheme: http - static_configs: - - targets: - - envoy:9901 - params: - format: ['prometheus']