# plano/chatbot_ui/run.py

import json
import os
import logging
import yaml
from common import get_arch_messages, get_prompt_targets
import gradio as gr

from typing import List, Optional, Tuple
from openai import OpenAI
from dotenv import load_dotenv

# Populate the process environment from a .env file so that the os.getenv
# lookups further down can see values defined there.
load_dotenv()


# Root logging configuration for the UI process: INFO and above, timestamped.
logging.basicConfig(
    level=logging.INFO,
    format="%(asctime)s - %(levelname)s - %(message)s",
)

log = logging.getLogger(__name__)

# Base URL of the OpenAI-compatible chat completion endpoint, read from the
# environment. It is None when the variable is not set.
CHAT_COMPLETION_ENDPOINT = os.getenv("CHAT_COMPLETION_ENDPOINT")
log.info("CHAT_COMPLETION_ENDPOINT: %s", CHAT_COMPLETION_ENDPOINT)
if not CHAT_COMPLETION_ENDPOINT:
    # Without an explicit base URL the OpenAI client silently falls back to
    # its own default endpoint, which is almost certainly not the intended
    # target here. Surface that at startup instead of failing later.
    log.warning(
        "CHAT_COMPLETION_ENDPOINT is not set; "
        "the OpenAI client will fall back to its default base URL"
    )


# Custom CSS handed to gr.Blocks in main(). It pins the height of the elements
# tagged with the "json-container" and "chatbot" classes, lets them scroll
# vertically, and hides the page footer.
CSS_STYLE = """
.json-container {
    height: 95vh !important;
    overflow-y: auto !important;
}
.chatbot {
    height: calc(95vh - 100px) !important;
    overflow-y: auto !important;
}
footer {visibility: hidden}
"""

# Shared OpenAI client used by chat(); requests go to CHAT_COMPLETION_ENDPOINT.
# The api_key is a "--" placeholder — presumably the gateway behind the
# endpoint supplies real credentials; TODO confirm.
client = OpenAI(
    api_key="--",
    base_url=CHAT_COMPLETION_ENDPOINT,
)


def chat(query: Optional[str], conversation: Optional[List[Tuple[str, str]]], state):
    """Send the user's message to the gateway and rebuild the chat view.

    This is a generator used as a Gradio event handler; it yields exactly once.

    Args:
        query: Text entered by the user. ``None``, empty, or whitespace-only
            input is ignored and nothing is sent to the gateway.
        conversation: Chat pairs currently shown in the UI. Echoed back
            unchanged when the query is ignored; otherwise replaced by pairs
            rebuilt from the stored history.
        state: Session dict. The full message list exchanged with the gateway
            is kept under the ``"history"`` key and mutated in place.

    Yields:
        A ``("", conversation, state)`` tuple: an empty string to clear the
        textbox, the chat pairs to display, and the session state.

    Raises:
        gr.Error: If the gateway call fails or its response cannot be
            interpreted. In both cases the user message added for this turn is
            removed from the history so later turns stay aligned.
    """
    history = state.setdefault("history", [])

    # Nothing to send: leave the history and the visible conversation untouched.
    if query is None or not query.strip():
        yield "", conversation, state
        return

    history.append({"role": "user", "content": query})
    log.info(f"history: {history}")

    try:
        raw_response = client.chat.completions.with_raw_response.create(
            model="--",
            messages=history,
            temperature=1.0,
        )
    except Exception as e:
        # remove last user message in case of exception
        history.pop()
        log.error("Error calling gateway API: {}".format(e))
        raise gr.Error("Error calling gateway API: {}".format(e)) from e

    # A successful response is not an error condition, so log it at INFO.
    log.info(f"raw_response: {raw_response.text}")

    # Interpret the whole response before touching the history, so a malformed
    # payload cannot leave a half-recorded turn behind.
    try:
        response = raw_response.parse()
        response_json = json.loads(raw_response.text)
        log.info(response_json)
        # Extra messages extracted from the raw JSON by get_arch_messages; they
        # are stored in the history and therefore sent back with the next request.
        arch_messages = get_arch_messages(response_json)
        content = response.choices[0].message.content
        model = response.model
    except Exception as e:
        # remove last user message so the history stays consistent
        history.pop()
        log.error("Error reading gateway response: {}".format(e))
        raise gr.Error("Error reading gateway response: {}".format(e)) from e

    history.extend(arch_messages)
    history.append({"role": "assistant", "content": content, "model": model})

    # for gradio UI we don't want to show raw tool calls and messages from developer application
    # so we're filtering those out
    history_view = [h for h in history if h["role"] != "tool" and "content" in h]

    # Pair consecutive entries (0, 1), (2, 3), ...; a trailing unpaired entry
    # is dropped by zip.
    # NOTE(review): this assumes the filtered view alternates user/assistant — confirm
    # against what get_arch_messages can return.
    conversation = [
        (first["content"], second["content"])
        for first, second in zip(history_view[0::2], history_view[1::2])
    ]

    yield "", conversation, state


def main():
    """Assemble the Gradio page and start serving it.

    The page is a single row with two columns: a JSON viewer listing the
    result of get_prompt_targets() on the left, and the chatbot with its input
    textbox on the right. Submitting the textbox runs chat(). The app is
    launched on 0.0.0.0:8080 with error display and debug mode enabled.
    """
    mono_fonts = [gr.themes.GoogleFont("IBM Plex Mono"), "Arial", "sans-serif"]
    page_theme = gr.themes.Default(font_mono=mono_fonts)

    with gr.Blocks(theme=page_theme, fill_height=True, css=CSS_STYLE) as demo:
        with gr.Row(equal_height=True):
            # Session dict that chat() reads and updates on every turn.
            session_state = gr.State({})

            # Left column: the available tools.
            with gr.Column(scale=4):
                gr.JSON(
                    value=get_prompt_targets(),
                    open=True,
                    show_indices=False,
                    label="Available Tools",
                    scale=1,
                    min_height="95vh",
                    elem_classes="json-container",
                )

            # Right column: conversation view plus the input box.
            with gr.Column(scale=6):
                chat_window = gr.Chatbot(
                    label="Arch Chatbot",
                    scale=1,
                    elem_classes="chatbot",
                )
                prompt_box = gr.Textbox(
                    show_label=False,
                    placeholder="Enter text and press enter",
                    scale=1,
                    autofocus=True,
                )

            # chat() receives and returns the same three components.
            prompt_box.submit(
                fn=chat,
                inputs=[prompt_box, chat_window, session_state],
                outputs=[prompt_box, chat_window, session_state],
            )

    demo.launch(
        server_name="0.0.0.0",
        server_port=8080,
        show_error=True,
        debug=True,
    )


# Start the UI only when this file is executed as a script, not when imported.
if __name__ == "__main__":
    main()
don't compute embeddings for names and other fixes see description (#126) * serialize tools - 2 * fix int tests * fix int test * fix unit tests 2024-10-05 19:25:16 -07:00			`import json`
Add workflow logic for weather forecast demo (#24) 2024-07-30 16:23:23 -07:00			`import os`
Pass tool call and app function response back in metadata (#193) 2024-10-18 13:25:39 -07:00			`import logging`
Update chatbot UI and update hallucination check (#218) * update chatbot UI * Update docker-compose for demos * Fix bugs * fix for emtadata (#219) * fix for emtadata * fix * revert * merge main --------- Co-authored-by: CTran <cotran2@utexas.edu> 2024-10-24 14:11:53 -07:00			`import yaml`
move tools at the bottom and make it collapsed by default 2024-10-29 00:10:11 -07:00			`from common import get_arch_messages, get_prompt_targets`
Update chatbot UI and update hallucination check (#218) * update chatbot UI * Update docker-compose for demos * Fix bugs * fix for emtadata (#219) * fix for emtadata * fix * revert * merge main --------- Co-authored-by: CTran <cotran2@utexas.edu> 2024-10-24 14:11:53 -07:00			`import gradio as gr`

			`from typing import List, Optional, Tuple`
Add support for streaming and fixes few issues (see description) (#202) 2024-10-28 20:05:06 -04:00			`from openai import OpenAI`
fix webui url and dependencies (#66) 2024-09-19 17:48:50 -07:00			`from dotenv import load_dotenv`

			`load_dotenv()`
Add function calling support using bolt-fc-1b (#35) 2024-09-10 14:24:46 -07:00
Add support for streaming and fixes few issues (see description) (#202) 2024-10-28 20:05:06 -04:00
Pass tool call and app function response back in metadata (#193) 2024-10-18 13:25:39 -07:00			`logging.basicConfig(`
			`level=logging.INFO,`
			`format="%(asctime)s - %(levelname)s - %(message)s",`
			`)`

			`log = logging.getLogger(__name__)`

fix webui url and dependencies (#66) 2024-09-19 17:48:50 -07:00			`CHAT_COMPLETION_ENDPOINT = os.getenv("CHAT_COMPLETION_ENDPOINT")`
Pass tool call and app function response back in metadata (#193) 2024-10-18 13:25:39 -07:00			`log.info(f"CHAT_COMPLETION_ENDPOINT: {CHAT_COMPLETION_ENDPOINT}")`
move demo functions out of model_server (#67) * pending * remove * fix docker build 2024-09-20 14:38:10 -07:00
Update chatbot UI and update hallucination check (#218) * update chatbot UI * Update docker-compose for demos * Fix bugs * fix for emtadata (#219) * fix for emtadata * fix * revert * merge main --------- Co-authored-by: CTran <cotran2@utexas.edu> 2024-10-24 14:11:53 -07:00
			`CSS_STYLE = """`
			`.json-container {`
			`height: 95vh !important;`
			`overflow-y: auto !important;`
			`}`
			`.chatbot {`
			`height: calc(95vh - 100px) !important;`
			`overflow-y: auto !important;`
			`}`
			`footer {visibility: hidden}`
			`"""`

lint + formating with black (#158) * lint + formating with black * add black as pre commit 2024-10-09 11:25:07 -07:00			`client = OpenAI(`
llm listener split (#155) 2024-10-09 15:47:32 -07:00			`api_key="--",`
lint + formating with black (#158) * lint + formating with black * add black as pre commit 2024-10-09 11:25:07 -07:00			`base_url=CHAT_COMPLETION_ENDPOINT,`
			`)`

add error warning if open ai key is missing 2024-07-31 15:51:31 -07:00
fix comments 2024-10-28 21:16:53 -07:00			`def chat(query: Optional[str], conversation: Optional[List[Tuple[str, str]]], state):`
lint + formating with black (#158) * lint + formating with black * add black as pre commit 2024-10-09 11:25:07 -07:00			`if "history" not in state:`
			`state["history"] = []`
Update chatbot UI and update hallucination check (#218) * update chatbot UI * Update docker-compose for demos * Fix bugs * fix for emtadata (#219) * fix for emtadata * fix * revert * merge main --------- Co-authored-by: CTran <cotran2@utexas.edu> 2024-10-24 14:11:53 -07:00
don't compute embeddings for names and other fixes see description (#126) * serialize tools - 2 * fix int tests * fix int test * fix unit tests 2024-10-05 19:25:16 -07:00			`history = state.get("history")`
Update chatbot UI and update hallucination check (#218) * update chatbot UI * Update docker-compose for demos * Fix bugs * fix for emtadata (#219) * fix for emtadata * fix * revert * merge main --------- Co-authored-by: CTran <cotran2@utexas.edu> 2024-10-24 14:11:53 -07:00			`history.append({"role": "user", "content": query})`
Pass tool call and app function response back in metadata (#193) 2024-10-18 13:25:39 -07:00			`log.info(f"history: {history}")`
Add support for local llm (mistral 7b) (#31) 2024-08-06 23:40:06 -07:00
Add workflow logic for weather forecast demo (#24) 2024-07-30 16:23:23 -07:00			`try:`
lint + formating with black (#158) * lint + formating with black * add black as pre commit 2024-10-09 11:25:07 -07:00			`raw_response = client.chat.completions.with_raw_response.create(`
llm listener split (#155) 2024-10-09 15:47:32 -07:00			`model="--",`
lint + formating with black (#158) * lint + formating with black * add black as pre commit 2024-10-09 11:25:07 -07:00			`messages=history,`
			`temperature=1.0,`
			`)`
use openai standard response in arch-fc and in gradio client (#62) * use openai standard response in arch-fc and in gradio client also fix code bug in usage * fix int test 2024-09-19 12:19:14 -07:00			`except Exception as e:`
lint + formating with black (#158) * lint + formating with black * add black as pre commit 2024-10-09 11:25:07 -07:00			`history.pop()`
remove streaming for run.py 2024-10-28 23:43:08 -07:00			`# remove last user message in case of exception`
			`log.error("Error calling gateway API: {}".format(e))`
Add support for streaming and fixes few issues (see description) (#202) 2024-10-28 20:05:06 -04:00			`raise gr.Error("Error calling gateway API: {}".format(e))`

remove streaming for run.py 2024-10-28 23:43:08 -07:00			`log.error(f"raw_response: {raw_response.text}")`
			`response = raw_response.parse()`

			`# extract arch_state from metadata and store it in gradio session state`
			`# this state must be passed back to the gateway in the next request`
			`response_json = json.loads(raw_response.text)`
			`log.info(response_json)`

			`arch_messages = get_arch_messages(response_json)`
			`for arch_message in arch_messages:`
			`history.append(arch_message)`

			`content = response.choices[0].message.content`

			`history.append({"role": "assistant", "content": content, "model": response.model})`
Add support for streaming and fixes few issues (see description) (#202) 2024-10-28 20:05:06 -04:00
remove streaming for run.py 2024-10-28 23:43:08 -07:00			`# for gradio UI we don't want to show raw tool calls and messages from developer application`
			`# so we're filtering those out`
			`history_view = [h for h in history if h["role"] != "tool" and "content" in h]`
Add support for streaming and fixes few issues (see description) (#202) 2024-10-28 20:05:06 -04:00
remove streaming for run.py 2024-10-28 23:43:08 -07:00			`conversation = [`
			`(history_view[i]["content"], history_view[i + 1]["content"])`
			`for i in range(0, len(history_view) - 1, 2)`
			`]`
Add support for streaming and fixes few issues (see description) (#202) 2024-10-28 20:05:06 -04:00
remove streaming for run.py 2024-10-28 23:43:08 -07:00			`yield "", conversation, state`
Update chatbot UI and update hallucination check (#218) * update chatbot UI * Update docker-compose for demos * Fix bugs * fix for emtadata (#219) * fix for emtadata * fix * revert * merge main --------- Co-authored-by: CTran <cotran2@utexas.edu> 2024-10-24 14:11:53 -07:00

			`def main():`
			`with gr.Blocks(`
			`theme=gr.themes.Default(`
			`font_mono=[gr.themes.GoogleFont("IBM Plex Mono"), "Arial", "sans-serif"]`
			`),`
			`fill_height=True,`
			`css=CSS_STYLE,`
			`) as demo:`
			`with gr.Row(equal_height=True):`
			`state = gr.State({})`

			`with gr.Column(scale=4):`
			`gr.JSON(`
			`value=get_prompt_targets(),`
			`open=True,`
			`show_indices=False,`
			`label="Available Tools",`
			`scale=1,`
			`min_height="95vh",`
			`elem_classes="json-container",`
			`)`
			`with gr.Column(scale=6):`
			`chatbot = gr.Chatbot(`
			`label="Arch Chatbot",`
			`scale=1,`
			`elem_classes="chatbot",`
			`)`
			`textbox = gr.Textbox(`
			`show_label=False,`
			`placeholder="Enter text and press enter",`
			`scale=1,`
			`autofocus=True,`
			`)`

			`textbox.submit(chat, [textbox, chatbot, state], [textbox, chatbot, state])`

			`demo.launch(server_name="0.0.0.0", server_port=8080, show_error=True, debug=True)`


			`if __name__ == "__main__":`
			`main()`