Update weather_forecast demo to spin up Grafana and Prometheus when using the monitoring profile

Includes a full dashboard with total requests, time per output token,
time to first token, total latency, output sequence length, and input
sequence length.
This commit is contained in:
aayushwhiz 2024-11-11 17:00:48 -08:00
parent f4e9624c03
commit 6fc32b0152
6 changed files with 772 additions and 1 deletions

View file

@@ -290,7 +290,7 @@ fn llm_gateway_request_ratelimited() {
let args = tester::MockSettings {
wasm_path: wasm_module(),
quiet: false,
-allow_unexpected: true,
+allow_unexpected: false,
};
let mut module = tester::mock(args).unwrap();