mirror of
https://github.com/katanemo/plano.git
synced 2026-06-23 15:38:07 +02:00
send latency numbers from model_server as metadata
This commit is contained in:
parent
14625e2a1d
commit
60dfb18018
4 changed files with 9 additions and 6 deletions
|
|
@ -124,7 +124,8 @@ impl StreamContext {
|
|||
let arch_fc_response: ChatCompletionsResponse = match serde_json::from_str(&body_str) {
|
||||
Ok(arch_fc_response) => arch_fc_response,
|
||||
Err(e) => {
|
||||
warn!("error deserializing archfc response: {}", e);
|
||||
warn!("error deserializing archfc response: {}, body: {}", e, body_str
|
||||
);
|
||||
return self.send_server_error(ServerError::Deserialization(e), None);
|
||||
}
|
||||
};
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue