add test for ml_engineer.

2026-06-11 15:15:18 +02:00 · 2023-12-21 10:11:07 +08:00 · 2023-12-21 10:11:07 +08:00 · a39cc30164
commit a39cc30164
parent 5af4f6b4c5
1 changed files with 36 additions and 0 deletions
--- a/tests/metagpt/roles/test_daml.py
+++ b/tests/metagpt/roles/test_daml.py
@ -0,0 +1,36 @@
+import pytest
+from tqdm import tqdm
+
+from metagpt.logs import logger
+from metagpt.roles.ml_engineer import MLEngineer
+
+
+async def make_use_tools(requirement: str, auto_run: bool = True):
+    """Run an MLEngineer on `requirement` twice: first making udfs, then using them.
+
+    The role's `reset()` is called between the first run and the second run.
+    """
+    engineer = MLEngineer(goal=requirement, auto_run=auto_run)
+    for make_phase in (True, False):
+        if not make_phase:
+            engineer.reset()
+        engineer.make_udfs = make_phase
+        engineer.use_udfs = not make_phase
+        await engineer.run(requirement)
+
+
+@pytest.mark.asyncio
+async def test_make_use_tools():  # runs make_use_tools once per requirement and logs the success rate
+    requirements = ["Run data analysis on sklearn Iris dataset, include a plot",
+                    "Run data analysis on sklearn Diabetes dataset, include a plot",
+                    "Run data analysis on sklearn Wine recognition dataset, include a plot, and train a model to predict wine class (20% as validation), and show validation accuracy",
+                    "Run data analysis on sklearn Wisconsin Breast Cancer dataset, include a plot, train a model to predict targets (20% as validation), and show validation accuracy",
+                    "Run EDA and visualization on this dataset, train a model to predict survival, report metrics on validation set (20%), dataset: tests/data/titanic.csv"]
+    success = 0  # count of requirements for which make_use_tools returned without raising
+    for requirement in tqdm(requirements, total=len(requirements)):
+        try:
+            await make_use_tools(requirement)
+            success += 1
+        except Exception as e:  # NOTE(review): a failing requirement is only logged; nothing is asserted, so it does not fail the test
+            logger.error(f"Found Error in {requirement}, {e}")
+    logger.info(f"success: {round(success/len(requirements), 1)*100}%")  # fraction rounded to 1 decimal, shown as a percentage