plano/chatbot_ui/app/run.py
Adil Hafeez 96686dc606
Serialize tool calls for Arch FC (#131)
* Serialize tool calls

* fix int tests
2024-10-07 00:03:25 -07:00

76 lines
2.7 KiB
Python

import json
import os
from openai import OpenAI, DefaultHttpxClient
import gradio as gr
import logging as log
from dotenv import load_dotenv
load_dotenv()
OPENAI_API_KEY=os.getenv("OPENAI_API_KEY")
MISTRAL_API_KEY = os.getenv("MISTRAL_API_KEY")
CHAT_COMPLETION_ENDPOINT = os.getenv("CHAT_COMPLETION_ENDPOINT")
MODEL_NAME = os.getenv("MODEL_NAME", "gpt-3.5-turbo")
ARCH_STATE_HEADER = 'x-arch-state'
log.info("CHAT_COMPLETION_ENDPOINT: ", CHAT_COMPLETION_ENDPOINT)
client = OpenAI(api_key=OPENAI_API_KEY, base_url=CHAT_COMPLETION_ENDPOINT, http_client=DefaultHttpxClient(headers={"accept-encoding": "*"}))
def predict(message, state):
if 'history' not in state:
state['history'] = []
history = state.get("history")
history.append({"role": "user", "content": message})
log.info("history: ", history)
# Custom headers
custom_headers = {
'x-arch-openai-api-key': f"{OPENAI_API_KEY}",
'x-arch-mistral-api-key': f"{MISTRAL_API_KEY}",
'x-arch-deterministic-provider': 'openai',
}
metadata = None
if 'arch_state' in state:
metadata = {ARCH_STATE_HEADER: state['arch_state']}
try:
raw_response = client.chat.completions.with_raw_response.create(model=MODEL_NAME,
messages = history,
temperature=1.0,
metadata=metadata,
extra_headers=custom_headers
)
except Exception as e:
log.info(e)
# remove last user message in case of exception
history.pop()
log.info("Error calling gateway API: {}".format(e.message))
raise gr.Error("Error calling gateway API: {}".format(e.message))
log.debug("raw_response: ", raw_response.text)
response = raw_response.parse()
# extract arch_state from metadata and store it in gradio session state
# this state must be passed back to the gateway in the next request
arch_state = json.loads(raw_response.text).get('metadata', {}).get(ARCH_STATE_HEADER, None)
if arch_state:
state['arch_state'] = arch_state
content = response.choices[0].message.content
history.append({"role": "assistant", "content": content, "model": response.model})
messages = [(history[i]["content"], history[i+1]["content"]) for i in range(0, len(history)-1, 2)]
return messages, state
with gr.Blocks(fill_height=True, css="footer {visibility: hidden}") as demo:
print("Starting Demo...")
chatbot = gr.Chatbot(label="Arch Chatbot", scale=1)
state = gr.State({})
with gr.Row():
txt = gr.Textbox(show_label=False, placeholder="Enter text and press enter", scale=1, autofocus=True)
txt.submit(predict, [txt, state], [chatbot, state])
demo.launch(server_name="0.0.0.0", server_port=8080, show_error=True, debug=True)