diff --git a/metagpt/actions/clone_function.py b/metagpt/actions/clone_function.py deleted file mode 100644 index 7053df97b..000000000 --- a/metagpt/actions/clone_function.py +++ /dev/null @@ -1,67 +0,0 @@ -from pathlib import Path - -from pydantic import Field - -from metagpt.actions.write_code import WriteCode -from metagpt.llm import LLM -from metagpt.logs import logger -from metagpt.provider.base_llm import BaseLLM -from metagpt.schema import Message -from metagpt.utils.exceptions import handle_exception -from metagpt.utils.highlight import highlight - -CLONE_PROMPT = """ -*context* -Please convert the function code ```{source_code}``` into the the function format: ```{template_func}```. -*Please Write code based on the following list and context* -1. Write code start with ```, and end with ```. -2. Please implement it in one function if possible, except for import statements. for exmaple: -```python -import pandas as pd -def run(*args) -> pd.DataFrame: - ... -``` -3. Do not use public member functions that do not exist in your design. -4. The output function name, input parameters and return value must be the same as ```{template_func}```. -5. Make sure the results before and after the code conversion are required to be exactly the same. -6. Don't repeat my context in your replies. -7. Return full results, for example, if the return value has df.head(), please return df. -8. If you must use a third-party package, use the most popular ones, for example: pandas, numpy, ta, ... -""" - - -class CloneFunction(WriteCode): - name: str = "CloneFunction" - context: list[Message] = [] - llm: BaseLLM = Field(default_factory=LLM) - - def _save(self, code_path, code): - if isinstance(code_path, str): - code_path = Path(code_path) - code_path.parent.mkdir(parents=True, exist_ok=True) - code_path.write_text(code, encoding="utf-8") - logger.info(f"Saving Code to {code_path}") - - async def run(self, template_func: str, source_code: str) -> str: - """将source_code转换成template_func一样的入参和返回类型""" - prompt = CLONE_PROMPT.format(source_code=source_code, template_func=template_func) - logger.info(f"query for CloneFunction: \n {prompt}") - code = await self.write_code(prompt) - logger.info(f"CloneFunction code is \n {highlight(code)}") - return code - - -@handle_exception -def run_function_code(func_code: str, func_name: str, *args, **kwargs): - """Run function code from string code.""" - locals_ = {} - exec(func_code, locals_) - func = locals_[func_name] - return func(*args, **kwargs), "" - - -def run_function_script(code_script_path: str, func_name: str, *args, **kwargs): - """Run function code from script.""" - code_path = Path(code_script_path) - code = code_path.read_text(encoding="utf-8") - return run_function_code(code, func_name, *args, **kwargs) diff --git a/metagpt/tools/code_interpreter.py b/metagpt/tools/code_interpreter.py deleted file mode 100644 index 9575d6c13..000000000 --- a/metagpt/tools/code_interpreter.py +++ /dev/null @@ -1,197 +0,0 @@ -import inspect -import re -import textwrap -from pathlib import Path -from typing import Callable, Dict, List - -import wrapt -from interpreter.core.core import Interpreter - -from metagpt.actions.clone_function import ( - CloneFunction, - run_function_code, - run_function_script, -) -from metagpt.config import CONFIG -from metagpt.logs import logger -from metagpt.utils.highlight import highlight - - -def extract_python_code(code: str): - """Extract code blocks: If the code comments are the same, only the last code block is kept.""" - # Use regular expressions to match comment blocks and related code. - pattern = r"(#\s[^\n]*)\n(.*?)(?=\n\s*#|$)" - matches = re.findall(pattern, code, re.DOTALL) - - # Extract the last code block when encountering the same comment. - unique_comments = {} - for comment, code_block in matches: - unique_comments[comment] = code_block - - # concatenate into functional form - result_code = "\n".join([f"{comment}\n{code_block}" for comment, code_block in unique_comments.items()]) - header_code = code[: code.find("#")] - code = header_code + result_code - - logger.info(f"Extract python code: \n {highlight(code)}") - - return code - - -class OpenCodeInterpreter(object): - """https://github.com/KillianLucas/open-interpreter""" - - def __init__(self, auto_run: bool = True) -> None: - interpreter = Interpreter() - interpreter.auto_run = auto_run - interpreter.model = CONFIG.openai_api_model or "gpt-3.5-turbo" - interpreter.api_key = CONFIG.openai_api_key - self.interpreter = interpreter - - def chat(self, query: str, reset: bool = True): - if reset: - self.interpreter.reset() - return self.interpreter.chat(query) - - @staticmethod - def extract_function( - query_respond: List, function_name: str, *, language: str = "python", function_format: str = None - ) -> str: - """create a function from query_respond.""" - if language not in ("python"): - raise NotImplementedError(f"Not support to parse language {language}!") - - # set function form - if function_format is None: - assert language == "python", f"Expect python language for default function_format, but got {language}." - function_format = """def {function_name}():\n{code}""" - # Extract the code module in the open-interpreter respond message. - # The query_respond of open-interpreter before v0.1.4 is: - # [{'role': 'user', 'content': your query string}, - # {'role': 'assistant', 'content': plan from llm, 'function_call': { - # "name": "run_code", "arguments": "{"language": "python", "code": code of first plan}, - # "parsed_arguments": {"language": "python", "code": code of first plan} - # ...] - if "function_call" in query_respond[1]: - code = [ - item["function_call"]["parsed_arguments"]["code"] - for item in query_respond - if "function_call" in item - and "parsed_arguments" in item["function_call"] - and "language" in item["function_call"]["parsed_arguments"] - and item["function_call"]["parsed_arguments"]["language"] == language - ] - # The query_respond of open-interpreter v0.1.7 is: - # [{'role': 'user', 'message': your query string}, - # {'role': 'assistant', 'message': plan from llm, 'language': 'python', - # 'code': code of first plan, 'output': output of first plan code}, - # ...] - elif "code" in query_respond[1]: - code = [ - item["code"] - for item in query_respond - if "code" in item and "language" in item and item["language"] == language - ] - else: - raise ValueError(f"Unexpect message format in query_respond: {query_respond[1].keys()}") - # add indent. - indented_code_str = textwrap.indent("\n".join(code), " " * 4) - # Return the code after deduplication. - if language == "python": - return extract_python_code(function_format.format(function_name=function_name, code=indented_code_str)) - - -def gen_query(func: Callable, args, kwargs) -> str: - # Get the annotation of the function as part of the query. - desc = func.__doc__ - signature = inspect.signature(func) - # Get the signature of the wrapped function and the assignment of the input parameters as part of the query. - bound_args = signature.bind(*args, **kwargs) - bound_args.apply_defaults() - query = f"{desc}, {bound_args.arguments}, If you must use a third-party package, use the most popular ones, for example: pandas, numpy, ta, ..." - return query - - -def gen_template_fun(func: Callable) -> str: - return f"def {func.__name__}{str(inspect.signature(func))}\n # here is your code ..." - - -class OpenInterpreterDecorator(object): - def __init__(self, save_code: bool = False, code_file_path: str = None, clear_code: bool = False) -> None: - self.save_code = save_code - self.code_file_path = code_file_path - self.clear_code = clear_code - - def _have_code(self, rsp: List[Dict]): - # Is there any code generated? - return "code" in rsp[1] and rsp[1]["code"] not in ("", None) - - def _is_faild_plan(self, rsp: List[Dict]): - # is faild plan? - func_code = OpenCodeInterpreter.extract_function(rsp, "function") - # If there is no more than 1 '\n', the plan execution fails. - if isinstance(func_code, str) and func_code.count("\n") <= 1: - return True - return False - - def _check_respond(self, query: str, interpreter: OpenCodeInterpreter, respond: List[Dict], max_try: int = 3): - for _ in range(max_try): - # TODO: If no code or faild plan is generated, execute chat again, repeating no more than max_try times. - if self._have_code(respond) and not self._is_faild_plan(respond): - break - elif not self._have_code(respond): - logger.warning(f"llm did not return executable code, resend the query: \n{query}") - respond = interpreter.chat(query) - elif self._is_faild_plan(respond): - logger.warning(f"llm did not generate successful plan, resend the query: \n{query}") - respond = interpreter.chat(query) - - # Post-processing of respond - if not self._have_code(respond): - error_msg = f"OpenCodeInterpreter do not generate code for query: \n{query}" - logger.error(error_msg) - raise ValueError(error_msg) - - if self._is_faild_plan(respond): - error_msg = f"OpenCodeInterpreter do not generate code for query: \n{query}" - logger.error(error_msg) - raise ValueError(error_msg) - return respond - - def __call__(self, wrapped): - @wrapt.decorator - async def wrapper(wrapped: Callable, instance, args, kwargs): - # Get the decorated function name. - func_name = wrapped.__name__ - # If the script exists locally and clearcode is not required, execute the function from the script. - if self.code_file_path and Path(self.code_file_path).is_file() and not self.clear_code: - return run_function_script(self.code_file_path, func_name, *args, **kwargs) - - # Auto run generate code by using open-interpreter. - interpreter = OpenCodeInterpreter() - query = gen_query(wrapped, args, kwargs) - logger.info(f"query for OpenCodeInterpreter: \n {query}") - respond = interpreter.chat(query) - # Make sure the response is as expected. - respond = self._check_respond(query, interpreter, respond, 3) - # Assemble the code blocks generated by open-interpreter into a function without parameters. - func_code = interpreter.extract_function(respond, func_name) - # Clone the `func_code` into wrapped, that is, - # keep the `func_code` and wrapped functions with the same input parameter and return value types. - template_func = gen_template_fun(wrapped) - cf = CloneFunction() - code = await cf.run(template_func=template_func, source_code=func_code) - # Display the generated function in the terminal. - logger_code = highlight(code, "python") - logger.info(f"Creating following Python function:\n{logger_code}") - # execute this function. - try: - res = run_function_code(code, func_name, *args, **kwargs) - if self.save_code and self.code_file_path: - cf._save(self.code_file_path, code) - except Exception as e: - logger.error(f"Could not evaluate Python code \n{logger_code}: \nError: {e}") - raise Exception("Could not evaluate Python code", e) - return res - - return wrapper(wrapped) diff --git a/tests/metagpt/tools/test_code_interpreter.py b/tests/metagpt/tools/test_code_interpreter.py deleted file mode 100644 index 792f7b05b..000000000 --- a/tests/metagpt/tools/test_code_interpreter.py +++ /dev/null @@ -1,43 +0,0 @@ -# from pathlib import Path -# -# import pandas as pd -# import pytest -# -# from metagpt.actions import Action -# from metagpt.logs import logger -# from metagpt.tools.code_interpreter import OpenCodeInterpreter, OpenInterpreterDecorator -# -# logger.add("./tests/data/test_ci.log") -# stock = "./tests/data/baba_stock.csv" -# -# -# # TODO: 需要一种表格数据格式,能够支持schame管理的,标注字段类型和字段含义。 -# class CreateStockIndicators(Action): -# @OpenInterpreterDecorator(save_code=True, code_file_path="./tests/data/stock_indicators.py") -# async def run(self, stock_path: str, indicators=["Simple Moving Average", "BollingerBands"]) -> pd.DataFrame: -# """对stock_path中的股票数据, 使用pandas和ta计算indicators中的技术指标, 返回带有技术指标的股票数据,不需要去除空值, 不需要安装任何包; -# 指标生成对应的三列: SMA, BB_upper, BB_lower -# """ -# ... -# -# -# @pytest.mark.asyncio -# async def test_actions(): -# # 计算指标 -# indicators = ["Simple Moving Average", "BollingerBands"] -# stocker = CreateStockIndicators() -# df, msg = await stocker.run(stock, indicators=indicators) -# assert isinstance(df, pd.DataFrame) -# assert "Close" in df.columns -# assert "Date" in df.columns -# # 将df保存为文件,将文件路径传入到下一个action -# df_path = "./tests/data/stock_indicators.csv" -# df.to_csv(df_path) -# assert Path(df_path).is_file() -# # 可视化指标结果 -# figure_path = "./tests/data/figure_ci.png" -# ci_ploter = OpenCodeInterpreter() -# ci_ploter.chat( -# f"使用seaborn对{df_path}中与股票布林带有关的数据列的Date, Close, SMA, BB_upper(布林带上界), BB_lower(布林带下界)进行可视化, 可视化图片保存在{figure_path}中。不需要任何指标计算,把Date列转换为日期类型。要求图片优美,BB_upper, BB_lower之间使用合适的颜色填充。" -# ) -# assert Path(figure_path).is_file()