From 72e550b148927ea7c58b989a5f80fde79dfc713e Mon Sep 17 00:00:00 2001
From: yzlin <yzlin@fuzhi.ai>
Date: Wed, 20 Dec 2023 15:39:18 +0800
Subject: [PATCH] minor update: move action, fix circular import, add entry
 parameters

---
 metagpt/actions/ml_da_action.py | 18 +++++++++++++--
 metagpt/roles/ml_engineer.py    | 40 ++++++++-------------------------
 metagpt/utils/recovery_util.py  |  3 +--
 3 files changed, 26 insertions(+), 35 deletions(-)

diff --git a/metagpt/actions/ml_da_action.py b/metagpt/actions/ml_da_action.py
index 5e4580b17..b6270f12f 100644
--- a/metagpt/actions/ml_da_action.py
+++ b/metagpt/actions/ml_da_action.py
@@ -3,9 +3,12 @@ from typing import Dict, List, Union
 
 from metagpt.actions import Action
 from metagpt.schema import Message, Plan
-from metagpt.utils.common import CodeParser
+from metagpt.utils.common import CodeParser, remove_comments, create_func_config
 from metagpt.logs import logger
-
+from metagpt.prompts.ml_engineer import (
+    UPDATE_DATA_COLUMNS,
+    PRINT_DATA_COLUMNS
+)
 
 class ReviewConst:
     TASK_REVIEW_TRIGGER = "task"
@@ -114,3 +117,14 @@ class Reflect(Action):
         rsp = CodeParser.parse_code(block=None, text=rsp_json)
         reflection = json.loads(rsp)["reflection"]
         return reflection
+
+
+class UpdateDataColumns(Action):
+    async def run(self, plan: Plan = None) -> dict:
+        finished_tasks = plan.get_finished_tasks()
+        code_context = [remove_comments(task.code) for task in finished_tasks]
+        code_context = "\n\n".join(code_context)
+        prompt = UPDATE_DATA_COLUMNS.format(history_code=code_context)
+        tool_config = create_func_config(PRINT_DATA_COLUMNS)
+        rsp = await self.llm.aask_code(prompt, **tool_config)
+        return rsp
diff --git a/metagpt/roles/ml_engineer.py b/metagpt/roles/ml_engineer.py
index 33b570d1a..73aba1fe8 100644
--- a/metagpt/roles/ml_engineer.py
+++ b/metagpt/roles/ml_engineer.py
@@ -4,10 +4,9 @@ from datetime import datetime
 
 import fire
 
-from metagpt.actions import Action
 from metagpt.actions.debug_code import DebugCode
 from metagpt.actions.execute_code import ExecutePyCode
-from metagpt.actions.ml_da_action import AskReview, SummarizeAnalysis, Reflect, ReviewConst
+from metagpt.actions.ml_da_action import AskReview, SummarizeAnalysis, Reflect, ReviewConst, UpdateDataColumns
 from metagpt.actions.write_analysis_code import WriteCodeByGenerate, WriteCodeWithTools
 from metagpt.actions.write_code_steps import WriteCodeSteps
 from metagpt.actions.write_plan import WritePlan
@@ -16,42 +15,26 @@ from metagpt.const import DATA_PATH, PROJECT_ROOT
 from metagpt.logs import logger
 from metagpt.memory import Memory
 from metagpt.prompts.ml_engineer import STRUCTURAL_CONTEXT
-from metagpt.prompts.ml_engineer import (
-    UPDATE_DATA_COLUMNS,
-    PRINT_DATA_COLUMNS
-)
 from metagpt.roles import Role
 from metagpt.roles.kaggle_manager import DownloadData, SubmitResult
 from metagpt.schema import Message, Plan
-from metagpt.utils.common import remove_comments, create_func_config
 from metagpt.utils.save_code import save_code_file
 from metagpt.utils.recovery_util import save_history, load_history
 
 
-class UpdateDataColumns(Action):
-    async def run(self, plan: Plan = None) -> dict:
-        finished_tasks = plan.get_finished_tasks()
-        code_context = [remove_comments(task.code) for task in finished_tasks]
-        code_context = "\n\n".join(code_context)
-        prompt = UPDATE_DATA_COLUMNS.format(history_code=code_context)
-        tool_config = create_func_config(PRINT_DATA_COLUMNS)
-        rsp = await self.llm.aask_code(prompt, **tool_config)
-        return rsp
-
-
 class MLEngineer(Role):
     def __init__(
-        self, name="ABC", profile="MLEngineer", goal="", auto_run: bool = False
+        self, name="ABC", profile="MLEngineer", goal="", auto_run: bool = False, use_tools=False, use_code_steps=False,
     ):
         super().__init__(name=name, profile=profile, goal=goal)
         self._set_react_mode(react_mode="plan_and_act")
         self._watch([DownloadData, SubmitResult])
         
         self.plan = Plan(goal=goal)
-        self.use_tools = True
-        self.use_code_steps = True
         self.execute_code = ExecutePyCode()
         self.auto_run = auto_run
+        self.use_tools = use_tools
+        self.use_code_steps = use_code_steps
         self.data_desc = {}
         
         # memory for working on each task, discarded each time a task is done
@@ -277,7 +260,6 @@ if __name__ == "__main__":
     # requirement = "Run data analysis on sklearn Wine recognition dataset, include a plot, and train a model to predict wine class (20% as validation), and show validation accuracy"
     # requirement = "Run data analysis on sklearn Wisconsin Breast Cancer dataset, include a plot, train a model to predict targets (20% as validation), and show validation accuracy"
     # requirement = "Run EDA and visualization on this dataset, train a model to predict survival, report metrics on validation set (20%), dataset: workspace/titanic/train.csv"
-    
     # requirement = "Perform data analysis on the provided data. Train a model to predict the target variable Survived. Include data preprocessing, feature engineering, and modeling in your pipeline. The metric is accuracy."
     
     # data_path = f"{DATA_PATH}/titanic"
@@ -291,13 +273,10 @@ if __name__ == "__main__":
     
     data_path = f"{DATA_PATH}/house-prices-advanced-regression-techniques"
     requirement = f"This is a house price dataset, your goal is to predict the sale price of a property based on its features. The target column is SalePrice. Perform data analysis, data preprocessing, feature engineering, and modeling to predict the target. Report RMSE between the logarithm of the predicted value and the logarithm of the observed sales price on the eval data. Train data path: '{data_path}/split_train.csv', eval data path: '{data_path}/split_eval.csv'."
-    
     save_dir = ""
-    
-    
     # save_dir = DATA_PATH / "output" / "2023-12-14_20-40-34"
-    
-    async def main(requirement: str = requirement, auto_run: bool = True, save_dir: str = save_dir):
+
+    async def main(requirement: str = requirement, auto_run: bool = True, use_tools: bool = False, use_code_steps: bool = False, save_dir: str = ""):
         """
         The main function to run the MLEngineer with optional history loading.
 
@@ -312,13 +291,13 @@ if __name__ == "__main__":
         if save_dir:
             logger.info("Resuming from history trajectory")
             plan, nb = load_history(save_dir)
-            role = MLEngineer(goal=requirement, auto_run=auto_run)
+            role = MLEngineer(goal=requirement, auto_run=auto_run, use_tools=use_tools, use_code_steps=use_code_steps)
             role.plan = Plan(**plan)
             role.execute_code = ExecutePyCode(nb)
         
         else:
             logger.info("Run from scratch")
-            role = MLEngineer(goal=requirement, auto_run=auto_run)
+            role = MLEngineer(goal=requirement, auto_run=auto_run, use_tools=use_tools, use_code_steps=use_code_steps)
         
         try:
             await role.run(requirement)
@@ -327,6 +306,5 @@ if __name__ == "__main__":
             save_path = save_history(role, save_dir)
             
             logger.exception(f"An error occurred: {e}, save trajectory here: {save_path}")
-    
-    
+
     fire.Fire(main)
diff --git a/metagpt/utils/recovery_util.py b/metagpt/utils/recovery_util.py
index ef4f0aca7..afe7fc021 100644
--- a/metagpt/utils/recovery_util.py
+++ b/metagpt/utils/recovery_util.py
@@ -8,7 +8,6 @@ import json
 from datetime import datetime
 
 from metagpt.roles.role import Role
-from metagpt.roles.ml_engineer import MLEngineer
 from metagpt.const import DATA_PATH
 from metagpt.utils.save_code import save_code_file
 
@@ -30,7 +29,7 @@ def load_history(save_dir: str = ""):
     return plan, nb
 
 
-def save_history(role: Role = MLEngineer, save_dir: str = ""):
+def save_history(role: Role, save_dir: str = ""):
     """
     Save history to the specified directory.