example fix

This commit is contained in:
liuminhui 2025-02-28 16:12:05 +08:00
parent c7314e31b8
commit 178ddaecb1
8 changed files with 14 additions and 9 deletions

View file

@@ -9,7 +9,7 @@ from pathlib import Path
import typer
from metagpt.config2 import config
from metagpt.config2 import Config
from metagpt.environment.android.android_env import AndroidEnv
from metagpt.ext.android_assistant.roles.android_assistant import AndroidAssistant
from metagpt.team import Team
@@ -41,6 +41,7 @@ def startup(
),
device_id: str = typer.Option(default="emulator-5554", help="The Android device_id"),
):
config = Config.default()
config.extra = {
"stage": stage,
"mode": mode,

BIN
examples/data/di/dog.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 15 KiB

Binary file not shown.

After

Width:  |  Height:  |  Size: 33 KiB

Binary file not shown.

View file

@@ -1,17 +1,18 @@
from metagpt.const import EXAMPLE_DATA_PATH
from metagpt.roles.di.data_interpreter import DataInterpreter
async def main():
# Notice: pip install metagpt[ocr] before using this example
image_path = "image.jpg"
image_path = EXAMPLE_DATA_PATH / "di/receipt_shopping.jpg"
language = "English"
requirement = f"""This is a {language} receipt image.
Your goal is to perform OCR on images using PaddleOCR, output text content from the OCR results and discard
coordinates and confidence levels, then recognize the total amount from ocr text content, and finally save as table.
coordinates and confidence levels, then recognize the total amount from ocr text content, and finally save as csv table.
Image path: {image_path}.
NOTE: The environments for Paddle and PaddleOCR are all ready and has been fully installed."""
di = DataInterpreter()
di = DataInterpreter(react_mode="react")
print(requirement)
await di.run(requirement)

View file

@@ -1,5 +1,6 @@
import asyncio
from metagpt.const import DEFAULT_WORKSPACE_ROOT, EXAMPLE_DATA_PATH
from metagpt.roles.di.data_interpreter import DataInterpreter
@@ -9,7 +10,7 @@ async def main(requirement: str = ""):
if __name__ == "__main__":
image_path = "/your/path/to/the/image.jpeg"
save_path = "/your/intended/save/path/for/image_rm_bg.png"
image_path = EXAMPLE_DATA_PATH / "di/dog.jpg"
save_path = DEFAULT_WORKSPACE_ROOT / "image_rm_bg.png"
requirement = f"This is a image, you need to use python toolkit rembg to remove the background of the image and save the result. image path:{image_path}; save path:{save_path}."
asyncio.run(main(requirement))

View file

@@ -1,6 +1,6 @@
import asyncio
from metagpt.config2 import config
from metagpt.config2 import Config
from metagpt.const import EXAMPLE_DATA_PATH
from metagpt.logs import logger
from metagpt.rag.parsers import OmniParse
@@ -12,6 +12,8 @@ TEST_PDF = EXAMPLE_DATA_PATH / "omniparse/test02.pdf"
TEST_VIDEO = EXAMPLE_DATA_PATH / "omniparse/test03.mp4"
TEST_AUDIO = EXAMPLE_DATA_PATH / "omniparse/test04.mp3"
config = Config.default()
async def omniparse_client_example():
client = OmniParseClient(base_url=config.omniparse.base_url)

View file

@@ -5,7 +5,7 @@
from gymnasium import spaces
from pydantic import ConfigDict, Field
from metagpt.environment.base_env_space import BaseEnvAction, BaseEnvActionType
from metagpt.base.base_env_space import BaseEnvAction, BaseEnvActionType
from metagpt.environment.werewolf.const import STEP_INSTRUCTIONS