mirror of
https://github.com/katanemo/plano.git
synced 2026-06-17 15:25:17 +02:00
Update the weather_forecast demo to spin up Grafana and Prometheus when using the monitoring profile
The demo includes a full dashboard showing total requests, time per output token, time to first token, total latency, output sequence length, and input sequence length.
This commit is contained in:
parent
f4e9624c03
commit
6fc32b0152
6 changed files with 772 additions and 1 deletions
|
|
@@ -290,7 +290,7 @@ fn llm_gateway_request_ratelimited() {
|
|||
let args = tester::MockSettings {
|
||||
wasm_path: wasm_module(),
|
||||
quiet: false,
|
||||
allow_unexpected: true,
|
||||
allow_unexpected: false,
|
||||
};
|
||||
let mut module = tester::mock(args).unwrap();
|
||||
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue