Update python scripts

2026-06-23 15:38:07 +02:00 · 2025-03-21 09:37:56 -07:00 · 2025-03-21 09:37:56 -07:00 · 20b8739c4f
commit 20b8739c4f
parent 1953860e8c
4 changed files with 33 additions and 6 deletions
--- a/tests/rest/utils/extract_tools_from_system_prompt.py
+++ b/tests/rest/utils/extract_tools_from_system_prompt.py
@ -0,0 +1,21 @@
+import json
+
+
+def extract_tools(system_prompt):
+    l = system_prompt.rfind("<tools>")
+    r = system_prompt.rfind("</tools>")
+
+    if l != -1 and r != -1:
+        tool_content = system_prompt[l + len("<tools>") : r]
+        print(tool_content.split("\n"))
+        tools = [json.loads(tool) for tool in tool_content.split("\n") if tool]
+        return tools
+    else:
+        raise ValueError("Invalid system prompt")
+
+
+if __name__ == "__main__":
+    system_prompt = 'You are a helpful assistant designed to assist with the user query by making one or more function calls if needed.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>\n{"name": "verify_address", "description": "Verify the address", "parameters": {"type": "object", "property_address": {"type": "str", "description": "Complete address of the property", "format": "Street address, City, State Country"}, "required": ["property_address"]}}\n{"name": "track_shipment", "description": "Track the shipment", "parameters": {"type": "object", "properties": {"tracking_number": {"type": "str", "description": "The tracking number"}}, "required": ["tracking_number"]}}\n{"name": "generate_label", "description": "Generate the shipping label", "parameters": {"type": "object", "properties": {"sender": {"type": "str", "description": "The address to ship from"}, "recipient": {"type": "str", "description": "The address to ship to"}, "weight": {"type": "int", "description": "The weight of the package"}}, "required": ["sender", "recipient", "weight"]}}\n{"name": "calculate_shipping_rate", "description": "Calculate the shipping rate", "parameters": {"type": "object", "properties": {"sender": {"type": "str", "description": "The address to ship from"}, "recipient": {"type": "str", "description": "The address to ship to"}, "weight": {"type": "int", "description": "The weight of the package"}}, "required": ["sender", "recipient", "weight"]}}\n</tools>\n\nYour task is to decide which functions are needed and collect missing parameters if necessary.\n\nBased on your analysis, provide your response in one of the following JSON formats:\n1. If no functions are needed:\n```\n{"response": "Your response text here"}\n```\n2. If functions are needed but some required parameters are missing:\n```\n{"required_functions": ["func_name1", "func_name2", ...], "clarification": "Text asking for missing parameters"}\n```\n3. If functions are needed and all required parameters are available:\n```\n{"tool_calls": [{"name": "func_name1", "arguments": {"argument1": "value1", "argument2": "value2"}},... (more tool calls as required)]}\n```'
+
+    tools = extract_tools(system_prompt)
+    print(json.dumps(tools, indent=4))
--- a/tests/rest/utils/generate_observations.py
+++ b/tests/rest/utils/generate_observations.py
@ -0,0 +1,17 @@
+# Use the format `{"name": "function_name", "result": "function_result"}` for each tool call
+tool_call_results = [
+    {"name": "get_weather", "result": "37.1 f"}
+    # {"name": "get_stock_price", "result": "247.66 USD"}
+    # Add more results if needed
+]
+
+
+def build_observations(tool_call_results):
+    observations = "\n".join([repr(x) for x in tool_call_results])
+    observations = f"<tool_response>\n{observations}\n</tool_response>"
+    return observations
+
+
+if __name__ == "__main__":
+    observations = build_observations(tool_call_results)
+    print(repr(observations))
--- a/tests/rest/utils/generate_random_system_prompt.py
+++ b/tests/rest/utils/generate_random_system_prompt.py
@ -0,0 +1,130 @@
+import json
+import random
+
+from datasets import load_dataset
+from typing import Any, Dict, List
+
+
+ARCH_FUNCTION_TOOL_PROMPT = (
+    "You are a helpful assistant designed to assist with the user query by making one or more function calls if needed."
+    "\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>{tool_text}\n</tools>"
+    "\n\nYour task is to decide which functions are needed and collect missing parameters if necessary.\n\n"
+)
+
+ARCH_FUNCTION_FORMAT_PROMPT = """
+Based on your analysis, provide your response in one of the following JSON formats:
+1. If no functions are needed:
+```
+{"response": "Your response text here"}
+```
+2. If functions are needed but some required parameters are missing:
+```
+{"required_functions": ["func_name1", "func_name2", ...], "clarification": "Text asking for missing parameters"}
+```
+3. If functions are needed and all required parameters are available:
+```
+{"tool_calls": [{"name": "func_name1", "arguments": {"argument1": "value1", "argument2": "value2"}},... (more tool calls as required)]}
+```
+""".strip()
+
+
+DATA_TYPE_MAP = {
+    "string": "str",
+    "integer": "int",
+    "boolean": "bool",
+    "number": "float",
+    "array": "list",
+    "Dict": "dict",
+    "List": "list",
+}
+
+
+def process_data_types(param_type):
+    extracted = {"type": [], "optional": False, "default": None}
+
+    param_type = [t.strip() for t in param_type.split(",")]
+
+    for t in param_type:
+        if t.startswith("optional"):
+            if t == "optional":
+                extracted["optional"] = True
+        elif t.startswith("default"):
+            if "=" in t:
+                extracted["default"] = t.split("=")[-1].strip()
+            else:
+                extracted["default"] = t.split(" ")[-1].strip()
+        else:
+            extracted["type"].append(t)
+
+    extracted["type"] = ", ".join(extracted["type"])
+
+    return extracted
+
+
+def convert_tool(tool):
+    converted = {
+        "name": tool["name"],
+        "description": tool["description"],
+        "parameters": {"type": "object", "properties": {}, "required": []},
+    }
+
+    for param_name, param_value in tool["parameters"].items():
+        extracted = process_data_types(param_value["type"])
+
+        if extracted["type"] in DATA_TYPE_MAP:
+            extracted["type"] = DATA_TYPE_MAP[extracted["type"]]
+
+        parameter = {
+            "type": extracted["type"],
+            "description": param_value["description"],
+        }
+
+        if "default" in param_value:
+            parameter["default"] = param_value["default"]
+        elif extracted["default"] is not None:
+            parameter["default"] = extracted["default"]
+
+        if "default" in parameter:
+            if parameter["default"] is None:
+                parameter.pop("default")
+            else:
+                try:
+                    if len(parameter["default"]) == 0:
+                        parameter.pop("default")
+                except Exception:
+                    pass
+
+        converted["parameters"]["properties"][param_name] = parameter
+
+        if not extracted["optional"]:
+            converted["parameters"]["required"].append(param_name)
+
+    return converted
+
+
+def build_system_prompt(tools: List[Dict[str, Any]]) -> str:
+    tool_text = ""
+    for tool in tools:
+        tool_text += "\n" + json.dumps(tool)
+
+    return (
+        ARCH_FUNCTION_TOOL_PROMPT.format(tool_text=tool_text)
+        + ARCH_FUNCTION_FORMAT_PROMPT
+    )
+
+
+if __name__ == "__main__":
+    xlam = load_dataset("Salesforce/xlam-function-calling-60k")
+
+    idx = random.sample(range(len(xlam["train"])), k=1)
+    example = xlam["train"][idx]
+
+    print("=" * 50 + " Tools " + "=" * 50)
+    tools = [convert_tool(tool) for tool in json.loads(example["tools"][0])]
+    print(json.dumps(tools, indent=4))
+
+    print("\n" + "=" * 50 + " System Prompt " + "=" * 50)
+    system_prompt = build_system_prompt(tools)
+
+    # print(repr(system_prompt.encode("unicode_escape").decode()))
+    print(json.dumps(system_prompt))
--- a/tests/rest/utils/generate_system_prompt.py
+++ b/tests/rest/utils/generate_system_prompt.py
@ -0,0 +1,77 @@
+import json
+from typing import Any, Dict, List
+
+
+ARCH_FUNCTION_TOOL_PROMPT = (
+    "You are a helpful assistant designed to assist with the user query by making one or more function calls if needed."
+    "\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>{tool_text}\n</tools>"
+    "\n\nYour task is to decide which functions are needed and collect missing parameters if necessary.\n\n"
+)
+
+ARCH_FUNCTION_FORMAT_PROMPT = """
+Based on your analysis, provide your response in one of the following JSON formats:
+1. If no functions are needed:
+```
+{"response": "Your response text here"}
+```
+2. If functions are needed but some required parameters are missing:
+```
+{"required_functions": ["func_name1", "func_name2", ...], "clarification": "Text asking for missing parameters"}
+```
+3. If functions are needed and all required parameters are available:
+```
+{"tool_calls": [{"name": "func_name1", "arguments": {"argument1": "value1", "argument2": "value2"}},... (more tool calls as required)]}
+```
+""".strip()
+
+
+tools = [
+    {
+        "name": "get_weather",
+        "description": "Retrieves current weather for the given location.",
+        "parameters": {
+            "type": "object",
+            "properties": {
+                "location": {
+                    "type": "str",
+                    "description": "City and country e.g. Bogotá, Colombia",
+                },
+                "units": {
+                    "type": "str",
+                    "enum": ["celsius", "fahrenheit"],
+                    "description": "Units the temperature will be returned in.",
+                },
+            },
+            "required": ["location", "units"],
+        },
+    },
+    {
+        "name": "get_stock_price",
+        "description": "Get the current stock price",
+        "parameters": {
+            "type": "object",
+            "properties": {
+                "symbol": {"type": "str", "description": "The stock symbol"}
+            },
+            "required": ["symbol"],
+        },
+    },
+]
+
+
+def build_system_prompt(tools: List[Dict[str, Any]]) -> str:
+    tool_text = ""
+    for tool in tools:
+        tool_text += "\n" + json.dumps(tool)
+
+    return (
+        ARCH_FUNCTION_TOOL_PROMPT.format(tool_text=tool_text)
+        + ARCH_FUNCTION_FORMAT_PROMPT
+    )
+
+
+if __name__ == "__main__":
+    system_prompt = build_system_prompt(tools)
+
+    # print(repr(system_prompt.encode("unicode_escape").decode()))
+    print(json.dumps(system_prompt))