From 56a9ac3ba9fde0d101e88ff789e825dc6b7243f4 Mon Sep 17 00:00:00 2001 From: cybermaggedon Date: Tue, 1 Oct 2024 21:04:55 +0100 Subject: [PATCH] Change LLM latency dashboard to be rate & bump version (#92) --- Makefile | 2 +- grafana/dashboards/dashboard.json | 12 ++++++++---- 2 files changed, 9 insertions(+), 5 deletions(-) diff --git a/Makefile b/Makefile index 4c8aaec2..d9366c4f 100644 --- a/Makefile +++ b/Makefile @@ -1,6 +1,6 @@ # VERSION=$(shell git describe | sed 's/^v//') -VERSION=0.11.14 +VERSION=0.11.15 DOCKER=podman diff --git a/grafana/dashboards/dashboard.json b/grafana/dashboards/dashboard.json index e2db0f09..04561863 100644 --- a/grafana/dashboards/dashboard.json +++ b/grafana/dashboards/dashboard.json @@ -90,14 +90,18 @@ "type": "prometheus", "uid": "f6b18033-5918-4e05-a1ca-4cb30343b129" }, - "editorMode": "code", + "disableTextWrap": false, + "editorMode": "builder", "exemplar": false, - "expr": "max by(le) (text_completion_duration_bucket)", + "expr": "sum by(le) (rate(text_completion_duration_bucket[$__rate_interval]))", "format": "heatmap", + "fullMetaSearch": false, + "includeNullMetadata": true, "instant": false, "legendFormat": "99%", "range": true, - "refId": "A" + "refId": "A", + "useBackend": false } ], "title": "LLM latency", @@ -1136,7 +1140,7 @@ "list": [] }, "time": { - "from": "now-5m", + "from": "now-15m", "to": "now" }, "timepicker": {},