mirror of
https://github.com/katanemo/plano.git
synced 2026-04-30 03:16:28 +02:00
Add in tpot (#269)
* add in tpot and tokens per second
* add in debug logs for new stats and update integration tests
* update shared dashboard to include new stats
This commit is contained in:
parent
9eeb790c7f
commit
1d229cba8f
4 changed files with 252 additions and 28 deletions
|
|
@ -75,6 +75,8 @@ fn setup_filter(module: &mut Tester, config: &str) -> i32 {
|
|||
.expect_metric_creation(MetricType::Gauge, "active_http_calls")
|
||||
.expect_metric_creation(MetricType::Counter, "ratelimited_rq")
|
||||
.expect_metric_creation(MetricType::Histogram, "time_to_first_token")
|
||||
.expect_metric_creation(MetricType::Histogram, "time_per_output_token")
|
||||
.expect_metric_creation(MetricType::Histogram, "tokens_per_second")
|
||||
.expect_metric_creation(MetricType::Histogram, "request_latency")
|
||||
.expect_metric_creation(MetricType::Histogram, "output_sequence_length")
|
||||
.expect_metric_creation(MetricType::Histogram, "input_sequence_length")
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue