use profile as sender & fix some bugs

2026-07-20 16:51:07 +02:00 · 2023-08-03 16:00:28 +08:00 · 2023-08-03 16:00:28 +08:00 · e546dbd6b8
commit e546dbd6b8
parent 144af68c09
5 changed files with 35 additions and 29 deletions
--- a/metagpt/actions/debug_error.py
+++ b/metagpt/actions/debug_error.py
@ -14,15 +14,15 @@ from metagpt.utils.common import CodeParser
 PROMPT_TEMPLATE = """
 NOTICE
 1. Role: You are a Development Engineer or QA engineer;
-2. Task: You received this message from another Development Engineer or QA engineer who run or test your code. 
+2. Task: You received this message from another Development Engineer or QA engineer who ran or tested your code. 
 Based on the message, first, figure out your own role, i.e. Engineer or QaEngineer,
 then rewrite the development code or the test code based on your role, the error, and the summary, such that all bugs are fixed and the code performs well.
-Attention: Use '##' to split sections, not '#', and '## <SECTION_NAME>' SHOULD WRITE BEFORE the test case or script and triple quote.
+Attention: Use '##' to split sections, not '#', and '## <SECTION_NAME>' SHOULD WRITE BEFORE the test case or script and triple quotes.
 The message is as follows:
 {context}
 ---
 Now you should start rewriting the code:
-## file name of the code to rewrite: Write code with triple quoto. Do your best to implement THIS ONLY ONE FILE.
+## file name of the code to rewrite: Write code with triple quoto. Do your best to implement THIS IN ONLY ONE FILE.
 """
 class DebugError(Action):
    def __init__(self, name="DebugError", context=None, llm=None):
--- a/metagpt/actions/run_code.py
+++ b/metagpt/actions/run_code.py
@ -8,6 +8,7 @@
 import traceback
 import os
 import subprocess
+from typing import List, Tuple

 from metagpt.logs import logger
 from metagpt.actions.action import Action
@ -59,18 +60,18 @@ class RunCode(Action):
        super().__init__(name, context, llm)

    @classmethod
-    async def run_text(cls, code):
+    async def run_text(cls, code) -> Tuple[str, str]:
        try:
            # We will document_store the result in this dictionary
            namespace = {}
            exec(code, namespace)
-            return namespace.get('result', None), ""
+            return namespace.get('result', ""), ""
        except Exception:
            # If there is an error in the code, return the error message
            return "", traceback.format_exc()

    @classmethod
-    async def run_script(cls, working_directory, additional_python_paths=[], command=[]):
+    async def run_script(cls, working_directory, additional_python_paths=[], command=[]) -> Tuple[str, str]:
        working_directory = str(working_directory)
        additional_python_paths = [str(path) for path in additional_python_paths]

@ -93,16 +94,16 @@ class RunCode(Action):
            process.kill()  # Kill the process if it times out
            stdout, stderr = process.communicate()
        return stdout.decode('utf-8'), stderr.decode('utf-8')
-    
+
    async def run(
        self, code, mode="script", code_file_name="", test_code="", test_file_name="", command=[], **kwargs
-    ):
+    ) -> str:
        logger.info(f"Running {' '.join(command)}")
        if mode == "script":
            outs, errs = await self.run_script(command=command, **kwargs)
        elif mode == "text":
            outs, errs = await self.run_text(code=code)
-        
+
        logger.info(f"{outs=}")
        logger.info(f"{errs=}")

@ -111,9 +112,9 @@ class RunCode(Action):
            test_code=test_code, test_file_name=test_file_name,
            command=" ".join(command),
            outs=outs[:500], # outs might be long but they are not important, truncate them to avoid token overflow
-            errs=errs
+            errs=errs[:10000] # truncate errors to avoid token overflow
        )
-        
+
        prompt = PROMPT_TEMPLATE.format(context=context)
        rsp = await self._aask(prompt)

--- a/metagpt/actions/write_test.py
+++ b/metagpt/actions/write_test.py
@ -15,10 +15,10 @@ NOTICE
 2. Requirement: Based on the context, develop a comprehensive test suite that adequately covers all relevant aspects of the code file under review. Your test suite will be part of the overall project QA, so please develop complete, robust, and reusable test cases.
 3. Attention1: Use '##' to split sections, not '#', and '## <SECTION_NAME>' SHOULD WRITE BEFORE the test case or script.
 4. Attention2: If there are any settings in your tests, ALWAYS SET A DEFAULT VALUE, ALWAYS USE STRONG TYPE AND EXPLICIT VARIABLE.
-5. Attention3: YOU MUST FOLLOW "Data structures and interface definitions". DO NOT CHANGE ANY DESIGN. Make sure your tests respect the existing design and ensure their validity.
+5. Attention3: YOU MUST FOLLOW "Data structures and interface definitions". DO NOT CHANGE ANY DESIGN. Make sure your tests respect the existing design and ensure its validity.
 6. Think before writing: What should be tested and validated in this document? What edge cases could exist? What might fail?
 7. CAREFULLY CHECK THAT YOU DON'T MISS ANY NECESSARY TEST CASES/SCRIPTS IN THIS FILE.
-Attention: Use '##' to split sections, not '#', and '## <SECTION_NAME>' SHOULD WRITE BEFORE the test case or script and triple quote.
+Attention: Use '##' to split sections, not '#', and '## <SECTION_NAME>' SHOULD WRITE BEFORE the test case or script and triple quotes.
 -----
 ## Given the following code, please write appropriate test cases using Python's unittest framework to verify the correctness and robustness of this code:
 ```python
--- a/metagpt/roles/qa_engineer.py
+++ b/metagpt/roles/qa_engineer.py
@ -5,6 +5,7 @@
@Author  : alexanderwu
@File    : qa_engineer.py
 """
+import os
 import re
 from pathlib import Path
 from typing import Type
@ -19,7 +20,7 @@ from metagpt.utils.common import CodeParser, parse_recipient
 from metagpt.utils.special_tokens import MSG_SEP, FILENAME_CODE_SEP

 class QaEngineer(Role):
-    def __init__(self, name="Edward", profile="QA Engineer",
+    def __init__(self, name="Edward", profile="QaEngineer",
                 goal="Write comprehensive and robust tests to ensure codes will work as expected without bugs",
                 constraints="The test code you write should conform to code standard like PEP8, be modular, easy to read and maintain"):
        super().__init__(name, profile, goal, constraints)
@ -86,7 +87,7 @@ class QaEngineer(Role):
            }
            msg = Message(
                content=str(file_info), role=self.profile, cause_by=WriteTest,
-                sent_from="QaEngineer", send_to="QaEngineer"
+                sent_from=self.profile, send_to=self.profile
            )
            self._publish_message(msg)
        
@ -94,14 +95,19 @@ class QaEngineer(Role):
    
    async def _run_code(self, msg):
        file_info = eval(msg.content)
-        code_to_test = open(file_info["file_path"], "r").read()
-        test_code = open(file_info["test_file_path"], "r").read()
+        development_file_path = file_info["file_path"]
+        test_file_path = file_info["test_file_path"]
+        if not os.path.exists(development_file_path) or not os.path.exists(test_file_path):
+            return
+
+        development_code = open(development_file_path, "r").read()
+        test_code = open(test_file_path, "r").read()
        proj_dir = self.get_workspace()
        development_code_dir = self.get_workspace(return_proj_dir=False)

        result_msg = await RunCode().run(
            mode="script",
-            code=code_to_test,
+            code=development_code,
            code_file_name=file_info["file_name"],
            test_code=test_code,
            test_file_name=file_info["test_file_name"],
@ -115,7 +121,7 @@ class QaEngineer(Role):
        content = str(file_info) + FILENAME_CODE_SEP + result_msg
        msg = Message(
            content=content, role=self.profile, cause_by=RunCode,
-            sent_from="QaEngineer", send_to=recipient
+            sent_from=self.profile, send_to=recipient
        )
        self._publish_message(msg)

@ -125,20 +131,20 @@ class QaEngineer(Role):
        if file_name:
            self.write_file(file_name, code)
            recipient = msg.sent_from # send back to the one who ran the code for another run, might be one's self
-            msg = Message(content=file_info, role=self.profile, cause_by=DebugError, sent_from="QaEngineer", send_to=recipient)
+            msg = Message(content=file_info, role=self.profile, cause_by=DebugError, sent_from=self.profile, send_to=recipient)
            self._publish_message(msg)
    
    async def _observe(self) -> int:
        await super()._observe()
        self._rc.news = [msg for msg in self._rc.news \
-            if msg.send_to == "QaEngineer"] # only relevant msgs count as observed news
+            if msg.send_to == self.profile] # only relevant msgs count as observed news
        return len(self._rc.news)

    async def _act(self) -> Message:
        if self.test_round > self.test_round_allowed:
            result_msg = Message(
                content=f"Exceeding {self.test_round_allowed} rounds of tests, skip (writing code counts as a round, too)",
-                role=self.profile, cause_by=WriteTest, sent_from="QaEngineer", send_to=""
+                role=self.profile, cause_by=WriteTest, sent_from=self.profile, send_to=""
            )
            return result_msg

@ -147,16 +153,16 @@ class QaEngineer(Role):
            # might potentially be moved to _think, that is, let the agent decides for itself
            if msg.cause_by == WriteCode:
                # engineer wrote a code, time to write a test for it
-                result_msg = await self._write_test(msg)
+                await self._write_test(msg)
            elif msg.cause_by in [WriteTest, DebugError]:
                # I wrote or debugged my test code, time to run it
-                result_msg = await self._run_code(msg)
+                await self._run_code(msg)
            elif msg.cause_by == RunCode:
                # I ran my test code, time to fix bugs, if any
-                result_msg = await self._debug_error(msg)
+                await self._debug_error(msg)
        self.test_round += 1
        result_msg = Message(
            content=f"Round {self.test_round} of tests done",
-            role=self.profile, cause_by=WriteTest, sent_from="QaEngineer", send_to=""
+            role=self.profile, cause_by=WriteTest, sent_from=self.profile, send_to=""
        )
        return result_msg
--- a/tests/metagpt/actions/test_debug_error.py
+++ b/tests/metagpt/actions/test_debug_error.py
@ -146,11 +146,10 @@ Engineer

@pytest.mark.asyncio
 async def test_debug_error():
-    code = "def add(a, b):\n    return a - b"
-    error = "AssertionError: Expected add(1, 1) to equal 2 but got 0"

    debug_error = DebugError("debug_error")

    file_name, rewritten_code = await debug_error.run(context=EXAMPLE_MSG_CONTENT)

-    assert "class TestPlayer" in rewritten_code
+    assert "class Player" in rewritten_code # rewrite the same class
+    assert "while self.score > 21" in rewritten_code # a key logic to rewrite to (original one is "if self.score > 12")