mirror of
https://github.com/FoundationAgents/MetaGPT.git
synced 2026-06-08 15:05:17 +02:00
engineer2 first draft, allow fine-grained tool reg, reg plan as tool
This commit is contained in:
parent
e54cc424e8
commit
8df76ce612
4 changed files with 318 additions and 8 deletions
49
metagpt/prompts/di/engineer2.py
Normal file
49
metagpt/prompts/di/engineer2.py
Normal file
|
|
@ -0,0 +1,49 @@
|
|||
CMD_PROMPT = """
|
||||
# Data Structure
|
||||
class Task(BaseModel):
|
||||
task_id: str = ""
|
||||
dependent_task_ids: list[str] = []
|
||||
instruction: str = ""
|
||||
task_type: str = ""
|
||||
assignee: str = "David"
|
||||
|
||||
# Available Commands
|
||||
{available_commands}
|
||||
Special Command: Use {{"command_name": "Common.pass"}} to do nothing and {{"command_name": "Common.end"}} to indicate completion of all requirements and the end of actions.
|
||||
|
||||
# Current Plan
|
||||
{plan_status}
|
||||
|
||||
# Current Task
|
||||
{current_task}
|
||||
|
||||
# Example
|
||||
{example}
|
||||
|
||||
# Instructions
|
||||
Based on the context, write a plan or modify an existing plan to achieve the goal. A plan consists of one to 3 tasks.
|
||||
If plan is created, you should track the progress and update the plan accordingly, such as Plan.finish_current_task, Plan.append_task, Plan.reset_task, Plan.replace_task, etc.
|
||||
When presented a current task, tackle the task using the available commands.
|
||||
Pay close attention to new user message, review the conversation history, use MGXEnv.reply_to_human to respond to new user requirement.
|
||||
Note:
|
||||
1. If you keeping encountering errors, unexpected situation, or you are not sure of proceeding, use MGXEnv.ask_human to ask for help.
|
||||
2. Carefully review your progress at the current task, if your actions so far has not fulfilled the task instruction, you should continue with current task. Otherwise, finish current task.
|
||||
3. Each time you finish a task, use MGXEnv.reply_to_human to report your progress.
|
||||
4. Each time you write a code in your response, write with the Editor directly without preparing a repetitive code block beforehand.
|
||||
Pay close attention to the Example provided, you can reuse the example for your current situation if it fits.
|
||||
|
||||
You may use any of the available commands to create a plan or update the plan. You may output mutiple commands, they will be executed sequentially.
|
||||
If you finish current task, you will automatically take the next task in the existing plan, use Plan.finish_task, DON'T append a new task.
|
||||
|
||||
# Your commands in a json array, in the following output format, always output ONE and ONLY ONE json array, if there is nothing to do, use the pass command:
|
||||
Some text indicating your thoughts, such as how you should update the plan status, respond to inquiry, or seek for help. Then a json array of commands.
|
||||
```json
|
||||
[
|
||||
{{
|
||||
"command_name": str,
|
||||
"args": {{"arg_name": arg_value, ...}}
|
||||
}},
|
||||
...
|
||||
]
|
||||
```
|
||||
"""
|
||||
218
metagpt/roles/di/engineer2.py
Normal file
218
metagpt/roles/di/engineer2.py
Normal file
|
|
@ -0,0 +1,218 @@
|
|||
from __future__ import annotations
|
||||
|
||||
import asyncio
|
||||
import json
|
||||
import traceback
|
||||
from typing import Literal
|
||||
|
||||
from pydantic import model_validator
|
||||
|
||||
from metagpt.actions import Action
|
||||
from metagpt.actions.di.write_analysis_code import WriteAnalysisCode
|
||||
from metagpt.logs import logger
|
||||
from metagpt.prompts.di.engineer2 import CMD_PROMPT
|
||||
from metagpt.roles.di.data_interpreter import DataInterpreter
|
||||
from metagpt.schema import Message, TaskResult
|
||||
from metagpt.strategy.experience_retriever import KeywordExpRetriever
|
||||
from metagpt.strategy.planner import Planner
|
||||
from metagpt.tools.libs.editor import Editor
|
||||
from metagpt.tools.tool_recommend import BM25ToolRecommender
|
||||
from metagpt.utils.common import CodeParser
|
||||
from test3 import design_doc_2048, design_doc_snake, task_doc_2048, task_doc_snake
|
||||
|
||||
|
||||
class Engineer2(DataInterpreter):
|
||||
name: str = "Alex"
|
||||
profile: str = "Engineer"
|
||||
goal: str = ""
|
||||
react_mode: Literal["react"] = "react"
|
||||
max_react_loop: int = 20 # used for react mode
|
||||
# task_result: TaskResult = None
|
||||
command_rsp: str = "" # the raw string containing the commands
|
||||
commands: list[dict] = [] # commands to be executed
|
||||
editor: Editor = Editor()
|
||||
|
||||
@model_validator(mode="after")
|
||||
def set_plan_and_tool(self) -> "DataInterpreter":
|
||||
# We force using this parameter for DataAnalyst
|
||||
assert self.react_mode == "react"
|
||||
assert self.auto_run
|
||||
assert self.use_plan
|
||||
|
||||
# Roughly the same part as DataInterpreter.set_plan_and_tool
|
||||
self._set_react_mode(react_mode=self.react_mode, max_react_loop=self.max_react_loop, auto_run=self.auto_run)
|
||||
if self.tools and not self.tool_recommender:
|
||||
self.tool_recommender = BM25ToolRecommender(tools=self.tools, force=True)
|
||||
self.set_actions([WriteAnalysisCode])
|
||||
self._set_state(0)
|
||||
|
||||
# HACK: Init Planner, control it through dynamic thinking; Consider formalizing as a react mode
|
||||
self.planner = Planner(goal="", working_memory=self.rc.working_memory, auto_run=True)
|
||||
|
||||
return self
|
||||
|
||||
async def _think(self) -> bool:
|
||||
"""Useful in 'react' mode. Use LLM to decide whether and what to do next."""
|
||||
if not self.rc.todo and not self.rc.news:
|
||||
return False
|
||||
|
||||
self._set_state(0)
|
||||
example = ""
|
||||
if not self.planner.plan.goal:
|
||||
self.user_requirement = self.get_memories()[-1].content
|
||||
self.planner.plan.goal = self.user_requirement
|
||||
example = KeywordExpRetriever().retrieve(self.user_requirement)
|
||||
else:
|
||||
# self.working_memory.add_batch(self.rc.news)
|
||||
self.rc.memory.add_batch(self.rc.news)
|
||||
# TODO: implement experience retrieval in multi-round setting
|
||||
# if self.planner.plan.current_task:
|
||||
# experience = KeywordExpRetriever().retrieve(self.planner.plan.current_task.instruction, exp_type="task")
|
||||
# if experience and experience not in [msg.content for msg in self.rc.memory.get()]:
|
||||
# exp_msg = Message(content=experience, role="assistant")
|
||||
# self.rc.memory.add(exp_msg)
|
||||
# example = KeywordExpRetriever().retrieve(self.planner.plan.current_task.instruction, exp_type="task")
|
||||
|
||||
plan_status = self.planner.plan.model_dump(include=["goal", "tasks"])
|
||||
for task in plan_status["tasks"]:
|
||||
task.pop("code")
|
||||
task.pop("result")
|
||||
task.pop("is_success")
|
||||
# print(plan_status)
|
||||
current_task = (
|
||||
self.planner.plan.current_task.model_dump(exclude=["code", "result", "is_success"])
|
||||
if self.planner.plan.current_task
|
||||
else ""
|
||||
)
|
||||
|
||||
tools = await self.tool_recommender.recommend_tools()
|
||||
tool_info = json.dumps({tool.name: tool.schemas for tool in tools})
|
||||
prompt = CMD_PROMPT.format(
|
||||
plan_status=plan_status,
|
||||
current_task=current_task,
|
||||
example=example,
|
||||
# available_commands=prepare_command_prompt(self.available_commands),
|
||||
available_commands=tool_info,
|
||||
)
|
||||
# context = self.llm.format_msg(self.working_memory.get() + [Message(content=prompt, role="user")])
|
||||
context = self.llm.format_msg(self.rc.memory.get(10) + [Message(content=prompt, role="user")])
|
||||
|
||||
print(*context, sep="\n" + "*" * 5 + "\n")
|
||||
|
||||
self.command_rsp = await self.llm.aask(context)
|
||||
|
||||
# self.rc.working_memory.add(Message(content=rsp, role="assistant"))
|
||||
self.rc.memory.add(Message(content=self.command_rsp, role="assistant"))
|
||||
|
||||
return True
|
||||
|
||||
async def _act(self) -> Message:
|
||||
try:
|
||||
commands = json.loads(CodeParser.parse_code(block=None, lang="json", text=self.command_rsp))
|
||||
except Exception as e:
|
||||
tb = traceback.format_exc()
|
||||
print(tb)
|
||||
error_msg = Message(content=str(e), role="user")
|
||||
self.rc.memory.add(error_msg)
|
||||
return error_msg
|
||||
outputs = await self.run_commands(commands)
|
||||
# self.rc.working_memory.add(Message(content=outputs, role="user"))
|
||||
self.rc.memory.add(Message(content=outputs, role="user"))
|
||||
return Message(content="Task completed", role="assistant", sent_from=self._setting, cause_by=WriteAnalysisCode)
|
||||
|
||||
async def _react(self) -> Message:
|
||||
actions_taken = 0
|
||||
rsp = Message(content="No actions taken yet", cause_by=Action) # will be overwritten after Role _act
|
||||
while actions_taken < self.rc.max_react_loop:
|
||||
# NOTE: difference here, keep observing within react
|
||||
await self._observe()
|
||||
# think
|
||||
has_todo = await self._think()
|
||||
if not has_todo:
|
||||
break
|
||||
# act
|
||||
logger.debug(f"{self._setting}: {self.rc.state=}, will do {self.rc.todo}")
|
||||
rsp = await self._act()
|
||||
actions_taken += 1
|
||||
return rsp # return output from the last action
|
||||
|
||||
async def run_commands(self, commands) -> list:
|
||||
tool_execute_map = {
|
||||
"Plan.append_task": self.planner.plan.append_task,
|
||||
"Plan.reset_task": self.planner.plan.reset_task,
|
||||
"Plan.replace_task": self.planner.plan.replace_task,
|
||||
"Editor.write": self.editor.write,
|
||||
"Editor.write_content": self.editor.write_content,
|
||||
"Editor.read": self.editor.read,
|
||||
}
|
||||
|
||||
# print(*commands, sep="\n")
|
||||
|
||||
is_success = True
|
||||
outputs = ["Commands executed."]
|
||||
for cmd in commands:
|
||||
if cmd["command_name"] in tool_execute_map:
|
||||
try:
|
||||
output = tool_execute_map[cmd["command_name"]](**cmd["args"])
|
||||
if output:
|
||||
outputs.append(f"Output for {cmd['command_name']}: {str(output)}")
|
||||
except Exception as e:
|
||||
tb = traceback.format_exc()
|
||||
print(e, tb)
|
||||
outputs.append(tb)
|
||||
is_success = False
|
||||
break # Stop executing if any command fails
|
||||
outputs = "\n\n".join(outputs)
|
||||
|
||||
# Handle finish_current_task and end individually as a last step
|
||||
for cmd in commands:
|
||||
if (
|
||||
is_success
|
||||
and cmd["command_name"] == "Plan.finish_current_task"
|
||||
and not self.planner.plan.is_plan_finished()
|
||||
):
|
||||
task_result = TaskResult(code=str(commands), result=outputs, is_success=is_success)
|
||||
self.planner.plan.current_task.update_task_result(task_result=task_result)
|
||||
self.planner.plan.finish_current_task()
|
||||
# self.rc.working_memory.clear()
|
||||
|
||||
elif cmd["command_name"] == "Common.end":
|
||||
self._set_state(-1)
|
||||
|
||||
return outputs
|
||||
|
||||
|
||||
WINE_REQ = "Run data analysis on sklearn Wine recognition dataset, and train a model to predict wine class (20% as validation), and show validation accuracy."
|
||||
|
||||
GAME_REQ_2048 = f"""
|
||||
Create a 2048 game, follow the design doc and task doc. Write your code under /Users/gary/Files/temp/workspace/2048_game/src.
|
||||
After writing all codes, write a code review for the codes, make improvement or adjustment based on the review.
|
||||
Notice: You MUST implement the full code, don't leave comment without implementation!
|
||||
Design doc:
|
||||
{task_doc_2048}
|
||||
Task doc:
|
||||
{design_doc_2048}
|
||||
"""
|
||||
GAME_REQ_SNAKE = f"""
|
||||
Create a snake game, follow the design doc and task doc. Write your code under /Users/gary/Files/temp/workspace/snake_game/src.
|
||||
After writing all codes, write a code review for the codes, make improvement or adjustment based on the review.
|
||||
Notice: You MUST implement the full code, don't leave comment without implementation!
|
||||
Design doc:
|
||||
{task_doc_snake}
|
||||
Task doc:
|
||||
{design_doc_snake}
|
||||
"""
|
||||
GAME_INC_REQ_2048 = """
|
||||
I found an issue with the 2048 code: when tiles are merged, no new tiles pop up.
|
||||
Write code review for the codes (game.py, main.py, ui.py) under under /Users/gary/Files/temp/workspace/2048_game_bugs/src.
|
||||
Then correct any issues you find. You can review all code in one time, and solve issues in one time.
|
||||
"""
|
||||
GAME_INC_REQ_SNAKE = """
|
||||
Based on the design doc at /Users/gary/Files/temp/workspace/snake_game_bugs/docs/20240513200737.json,
|
||||
Write code review for the codes (food.py, game.py, main.py, snake.py, ui.py) under under /Users/gary/Files/temp/workspace/snake_game_bugs/src.
|
||||
Then correct any issues you find. You can read the design doc first, then review all code in one time, and solve issues in one time.
|
||||
"""
|
||||
|
||||
if __name__ == "__main__":
|
||||
engineer2 = Engineer2(tools=["Plan", "Editor:write,read,write_content", "MGXEnv:ask_human,reply_to_human"])
|
||||
asyncio.run(engineer2.run(GAME_INC_REQ_2048))
|
||||
|
|
@ -49,6 +49,7 @@ from metagpt.const import (
|
|||
)
|
||||
from metagpt.logs import logger
|
||||
from metagpt.repo_parser import DotClassInfo
|
||||
from metagpt.tools.tool_registry import register_tool
|
||||
from metagpt.utils.common import CodeParser, any_to_str, any_to_str_set, import_class
|
||||
from metagpt.utils.exceptions import handle_exception
|
||||
from metagpt.utils.report import TaskReporter
|
||||
|
|
@ -430,7 +431,17 @@ class TaskResult(BaseModel):
|
|||
is_success: bool
|
||||
|
||||
|
||||
@register_tool(
|
||||
include_functions=[
|
||||
"append_task",
|
||||
"reset_task",
|
||||
"replace_task",
|
||||
"finish_current_task",
|
||||
]
|
||||
)
|
||||
class Plan(BaseModel):
|
||||
"""Plan is a sequence of tasks towards a goal."""
|
||||
|
||||
goal: str
|
||||
context: str = ""
|
||||
tasks: list[Task] = []
|
||||
|
|
@ -503,13 +514,10 @@ class Plan(BaseModel):
|
|||
|
||||
def reset_task(self, task_id: str):
|
||||
"""
|
||||
Clear code and result of the task based on task_id, and set the task as unfinished.
|
||||
Reset a task based on task_id, i.e. set Task.is_finished=False and request redo. This also resets all tasks depending on it.
|
||||
|
||||
Args:
|
||||
task_id (str): The ID of the task to be reset.
|
||||
|
||||
Returns:
|
||||
None
|
||||
"""
|
||||
if task_id in self.task_map:
|
||||
task = self.task_map[task_id]
|
||||
|
|
@ -522,7 +530,7 @@ class Plan(BaseModel):
|
|||
|
||||
self._update_current_task()
|
||||
|
||||
def replace_task(self, new_task: Task):
|
||||
def _replace_task(self, new_task: Task):
|
||||
"""
|
||||
Replace an existing task with the new input task based on task_id, and reset all tasks depending on it.
|
||||
|
||||
|
|
@ -547,7 +555,7 @@ class Plan(BaseModel):
|
|||
|
||||
self._update_current_task()
|
||||
|
||||
def append_task(self, new_task: Task):
|
||||
def _append_task(self, new_task: Task):
|
||||
"""
|
||||
Append a new task to the end of existing task sequences
|
||||
|
||||
|
|
@ -615,6 +623,23 @@ class Plan(BaseModel):
|
|||
"""
|
||||
return [task for task in self.tasks if task.is_finished]
|
||||
|
||||
def append_task(self, task_id: str, dependent_task_ids: list[str], instruction: str, assignee: str):
|
||||
"""Append a new task with task_id (number) to the end of existing task sequences. If dependent_task_ids is not empty, the task will depend on the tasks with the ids in the list."""
|
||||
new_task = Task(
|
||||
task_id=task_id, dependent_task_ids=dependent_task_ids, instruction=instruction, assignee=assignee
|
||||
)
|
||||
return self._append_task(new_task)
|
||||
|
||||
def replace_task(self, task_id: str, new_dependent_task_ids: list[str], new_instruction: str, new_assignee: str):
|
||||
"""Replace an existing task (can be current task) based on task_id, and reset all tasks depending on it."""
|
||||
new_task = Task(
|
||||
task_id=task_id,
|
||||
dependent_task_ids=new_dependent_task_ids,
|
||||
instruction=new_instruction,
|
||||
assignee=new_assignee,
|
||||
)
|
||||
return self._replace_task(new_task)
|
||||
|
||||
|
||||
class MessageQueue(BaseModel):
|
||||
"""Message queue which supports asynchronous updates."""
|
||||
|
|
|
|||
|
|
@ -137,8 +137,26 @@ def validate_tool_names(tools: list[str]) -> dict[str, Tool]:
|
|||
# if tool paths are provided, they will be registered on the fly
|
||||
if os.path.isdir(key) or os.path.isfile(key):
|
||||
valid_tools.update(register_tools_from_path(key))
|
||||
elif TOOL_REGISTRY.has_tool(key):
|
||||
valid_tools.update({key: TOOL_REGISTRY.get_tool(key)})
|
||||
elif TOOL_REGISTRY.has_tool(key.split(":")[0]):
|
||||
if ":" in key:
|
||||
# handle class tools with methods specified, such as Editor:read,write
|
||||
class_tool_name = key.split(":")[0]
|
||||
method_names = key.split(":")[1].split(",")
|
||||
class_tool = TOOL_REGISTRY.get_tool(class_tool_name)
|
||||
|
||||
methods_filtered = {}
|
||||
for method_name in method_names:
|
||||
if method_name in class_tool.schemas["methods"]:
|
||||
methods_filtered[method_name] = class_tool.schemas["methods"][method_name]
|
||||
else:
|
||||
logger.warning(f"invalid method {method_name} under tool {class_tool_name}, skipped")
|
||||
class_tool_filtered = class_tool.model_copy(deep=True)
|
||||
class_tool_filtered.schemas["methods"] = methods_filtered
|
||||
|
||||
valid_tools.update({class_tool_name: class_tool_filtered})
|
||||
|
||||
else:
|
||||
valid_tools.update({key: TOOL_REGISTRY.get_tool(key)})
|
||||
elif TOOL_REGISTRY.has_tool_tag(key):
|
||||
valid_tools.update(TOOL_REGISTRY.get_tools_by_tag(key))
|
||||
else:
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue