Merge branch 'feat-intention-fs' into 'mgx_ops'

fixbug: 限制quick_think生成内容，防止模型在quick_think里直接生成快问快答的答案 See merge request pub/MetaGPT!299
2026-07-23 17:01:08 +02:00 · 2024-08-14 06:53:29 +00:00 · 2024-08-14 06:53:29 +00:00 · a7f0a387f7
commit a7f0a387f7
parent c7dadaa4d7 3490a4e234
5 changed files with 48 additions and 32 deletions
--- a/metagpt/prompts/di/role_zero.py
+++ b/metagpt/prompts/di/role_zero.py
@ -125,30 +125,46 @@ If no issues are detected, the original json data should be returned unchanged.
 Output the JSON data in a format that can be loaded by the json.loads() function.
 """

-QUICK_THINK_PROMPT = """
+QUICK_THINK_SYSTEM_PROMPT = """
+{role_info}
+Your role is to determine the appropriate response category for the given request.
+
 # Response Categories
 ## QUICK: 
-For straightforward questions or requests that can be answered directly. This includes common-sense inquiries, legal or logical questions, basic math, short coding tasks, multiple-choice questions, greetings, casual chat, and inquiries about you or your team.
+For straightforward questions or requests that can be answered directly. This includes common-sense inquiries, legal or logical questions, basic math, short coding tasks, multiple-choice questions, greetings, casual chat, daily planning, and inquiries about you or your team.

 ## SEARCH
 For queries that require retrieving up-to-date or detailed information. This includes time-sensitive or location-specific questions like current events or weather. Use this only if the information isn't readily available.
+If a file or link is provided, you don't need to search for additional information.

 ## TASK
-For complex requests that involve multiple steps or detailed instructions. Examples include software development, project planning, or any task that requires a sequence of actions.
+For requests that involve tool utilizations, computer operations, multiple steps or detailed instructions. Examples include software development, project planning, or any task that requires tool usage.

 ## AMBIGUOUS
 For requests that are unclear, lack sufficient detail, or are outside the system's capabilities. Common characteristics of AMBIGUOUS requests:

- Incomplete Information: Requests that imply complex tasks but lack critical details  (e.g., "Redesign this logo" without providing the original logo or specifying design requirements).
+- Incomplete Information: Requests that imply complex tasks but lack critical details  (e.g., "Redesign this logo" without specifying design requirements).
 - Vagueness: Broad, unspecified, or unclear requests that make it difficult to provide a precise answer. 
- Out of Expertise: Requests for specialized advice (e.g., medical or legal advice) or highly technical tasks beyond the model's scope.
 - Unrealistic Scope: Overly broad requests that are impossible to address meaningfully in a single response (e.g., "Tell me everything about...").
+- Missing files: Requests that refer to specific documents, images, or data without providing them for reference. (when providing a file, website, or data, either the content, link, or path **must** be included)

-**Note:** Before categorizing a request as TASK, consider whether the user has provided sufficient information to proceed with the task. If the request is complex but lacks essential details or the mentioned files, it should fall under AMBIGUOUS.
+**Note:** Before categorizing a request as TASK:
+1. Consider whether the user has provided sufficient information to proceed with the task. If the request is complex but lacks essential details or the mentioned files' content or path, it should fall under AMBIGUOUS.
+2. If the request is a "how-to" question that asks for a general plan, approach or strategy, it should be categorized as QUICK.

 {examples}
+"""

-Respond with a concise thought, then provide the appropriate response category: QUICK, SEARCH, TASK, or AMBIGUOUS. Your response:
+QUICK_THINK_PROMPT = """
+# Instruction
+Determine the previous message's intent.
+Respond with a concise thought, then provide the appropriate response category: QUICK, SEARCH, TASK, or AMBIGUOUS. 
+
+# Format
+Thought: [Your thought here]
+Response Category: [QUICK/SEARCH/TASK/AMBIGUOUS]
+
+# Response:
 """


@ -163,8 +179,8 @@ Response Category: QUICK.
 Thought: This is a general knowledge question that can be answered concisely. 
 Response Category: QUICK.

-3. Request: "Can you help me plan a healthy diet for a week?"
-Thought: The user is requesting a simple plan that can be provided immediately. 
+3. Request: "Please help me write a learning plan for Python web crawlers"
+Thought: Writing a learning plan is a daily planning task that can be answered directly.
 Response Category: QUICK.

 4. Request: "Can you help me find the latest research papers on deep learning?"
@ -176,18 +192,15 @@ Thought: This is a detailed software development task that requires multiple ste
 Response Category: TASK.

 6. Request: "Summarize this document for me."
-Thought: The request mentions summarizing a document but doesn't provide the document itself, making it impossible to fulfill. 
+Thought: The request mentions summarizing a document but doesn't provide the path or content of the document, making it impossible to fulfill. 
 Response Category: AMBIGUOUS.

-7. Request: "Optimize this process." 
+7. Request: "Summarize this document for me '/data/path/docmument.pdf'." 
+Thought: The request mentions summarizing a document and has provided the path to the document. It can be done by reading the document using a tool then summarizing it.
+Response Category: TASK.
+
+8. Request: "Optimize this process." 
 Thought: The request is vague and lacks specifics, requiring clarification on the process to optimize.
 Response Category: AMBIGUOUS.

-8. Request: "Create a poster for our upcoming event." 
-Thought: Critical details like event theme, date, and location are missing, making it impossible to complete the task.
-Response Category: AMBIGUOUS.
-
-# Instruction
 """
-
-QUICK_THINK_PROMPT = QUICK_THINK_PROMPT.format(examples=QUICK_THINK_EXAMPLES)
--- a/metagpt/prompts/di/team_leader.py
+++ b/metagpt/prompts/di/team_leader.py
@ -35,11 +35,11 @@ Sixth, describe the requirements as they pertain to software development, data a
 Seventh, describe the technologies you must use.  
 """
 )
-QUICK_THINK_SYSTEM_PROMPT = """
+
+TL_INFO = """
 {role_info}
 Your team member:
 {team_info}
-However, you MUST respond to the user message by yourself directly, DON'T ask your team members.
 """

 FINISH_CURRENT_TASK_CMD = """
--- a/metagpt/roles/di/data_analyst.py
+++ b/metagpt/roles/di/data_analyst.py
@ -30,7 +30,7 @@ class DataAnalyst(RoleZero):
    instruction: str = ROLE_INSTRUCTION + EXTRA_INSTRUCTION
    task_type_desc: str = TASK_TYPE_DESC

-    tools: list[str] = ["Plan", "DataAnalyst", "RoleZero", "Browser"]
+    tools: list[str] = ["Plan", "DataAnalyst", "RoleZero", "Browser", "Editor:write,read"]
    custom_tools: list[str] = ["web scraping", "Terminal"]
    custom_tool_recommender: ToolRecommender = None
    experience_retriever: Annotated[ExpRetriever, Field(exclude=True)] = KeywordExpRetriever()
--- a/metagpt/roles/di/role_zero.py
+++ b/metagpt/roles/di/role_zero.py
@ -21,6 +21,8 @@ from metagpt.prompts.di.role_zero import (
    CMD_PROMPT,
    JSON_REPAIR_PROMPT,
    QUICK_THINK_PROMPT,
+    QUICK_THINK_EXAMPLES,
+    QUICK_THINK_SYSTEM_PROMPT,
    REGENERATE_PROMPT,
    ROLE_INSTRUCTION,
    SYSTEM_PROMPT,
@ -253,6 +255,10 @@ class RoleZero(Role):
            rsp = await self._act()
            actions_taken += 1
        return rsp  # return output from the last action
+    
+    def format_quick_system_prompt(self) -> str:
+        """Format the system prompt for quick thinking."""
+        return QUICK_THINK_SYSTEM_PROMPT.format(examples=QUICK_THINK_EXAMPLES, role_info=self._get_prefix())

    async def _quick_think(self) -> Tuple[Message, str]:
        answer = ""
@ -264,7 +270,7 @@ class RoleZero(Role):
        # routing
        memory = self.get_memories(k=4)  # FIXME: A magic number for two rounds of Q&A
        context = self.llm.format_msg(memory + [UserMessage(content=QUICK_THINK_PROMPT)])
-        intent_result = await self.llm.aask(context)
+        intent_result = await self.llm.aask(context, system_msgs=self.format_quick_system_prompt())

        if "QUICK" in intent_result or "AMBIGUOUS " in intent_result:  # llm call with the original context
            async with ThoughtReporter(enable_llm_stream=True) as reporter:
--- a/metagpt/roles/di/team_leader.py
+++ b/metagpt/roles/di/team_leader.py
@ -7,7 +7,7 @@ from pydantic import Field
 from metagpt.actions.di.run_command import RunCommand
 from metagpt.prompts.di.team_leader import (
    FINISH_CURRENT_TASK_CMD,
-    QUICK_THINK_SYSTEM_PROMPT,
+    TL_INFO,
    TL_INSTRUCTION,
    TL_THOUGHT_GUIDANCE,
 )
@ -47,15 +47,12 @@ class TeamLeader(RoleZero):
            #     continue
            team_info += f"{role.name}: {role.profile}, {role.goal}\n"
        return team_info
-
-    async def _quick_think(self) -> Message:
-        # insert team info for quick question
-        self.llm.system_prompt = QUICK_THINK_SYSTEM_PROMPT.format(
-            role_info=super()._get_prefix(),
-            team_info=self._get_team_info(),
-        )
-        return await super()._quick_think()
-
+    
+    def _get_prefix(self) -> str:
+        role_info = super()._get_prefix()
+        team_info = self._get_team_info()
+        return TL_INFO.format(role_info=role_info, team_info=team_info)
+    
    async def _think(self) -> bool:
        self.instruction = TL_INSTRUCTION.format(team_info=self._get_team_info())
        return await super()._think()