mirror of
https://github.com/katanemo/plano.git
synced 2026-06-17 15:25:17 +02:00
update rust side to handle default targets
This commit is contained in:
parent
6be6cc6346
commit
866494da27
5 changed files with 113 additions and 76 deletions
|
|
@@ -171,7 +171,7 @@ class ArchBaseHandler:
|
|||
assert processed_messages[-1]["role"] == "user"
|
||||
|
||||
if extra_instruction:
|
||||
- processed_messages[-1]["content"] += extra_instruction
|
||||
+ processed_messages[-1]["content"] += "\n" + extra_instruction
|
||||
|
||||
# keep the first system message and shift conversation if the total token length exceeds the limit
|
||||
def truncate_messages(messages: List[Dict[str, Any]]):
|
||||
|
|
|
|||
|
|
@@ -104,7 +104,7 @@ async def function_calling(req: ChatMessage, res: Response):
|
|||
res.status_code = 500
|
||||
error_messages = f"[Arch-Function] - Error in ChatCompletion: {e}"
|
||||
else:
|
||||
- # TODO: make a call to default LLM to get responses
|
||||
+ # no intent matched
|
||||
intent_response.metadata = {
|
||||
"intent_latency": str(round(intent_latency * 1000, 3)),
|
||||
}
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue