diff --git a/config/config.yaml b/config/config.yaml
index 412da8b15..d8fab693e 100644
--- a/config/config.yaml
+++ b/config/config.yaml
@@ -88,18 +88,9 @@ TIMEOUT: 60 # Timeout for llm invocation
 
 #### for OPENAI VISION
 
-#OPENAI_VISION_URL: "YOUR_OPENAI_ENDPOINT"
-#OPENAI_VISION_KEY: "YOUR_API_KEY"
 #OPENAI_VISION_MODEL: "YOUR_VISION_MODEL_NAME"
 #VISION_MAX_TOKENS: 4096
 
-#### for AZURE VISION
-
-#AZURE_VISION_URL: "YOUR_AZURE_ENDPOINT"
-#AZURE_VISION_KEY: "YOUR_API_KEY"
-#AZURE_VISION_REGION: "YOUR_VISION_MODEL_NAME"
-#VISION_MAX_TOKENS: 4096
-
 #### for Stable Diffusion
 ## Use SD service, based on https://github.com/AUTOMATIC1111/stable-diffusion-webui
 #SD_URL: "YOUR_SD_URL"
diff --git a/metagpt/tools/functions/libs/vision.py b/metagpt/tools/functions/libs/vision.py
index e6924b9bc..8c29b0567 100644
--- a/metagpt/tools/functions/libs/vision.py
+++ b/metagpt/tools/functions/libs/vision.py
@@ -11,8 +11,8 @@ import base64
 
 from metagpt.config import CONFIG
 
-OPENAI_API_BASE = CONFIG.OPENAI_VISION_URL
-API_KEY = CONFIG.OPENAI_VISION_KEY
+OPENAI_API_BASE = CONFIG.OPENAI_BASE_URL
+API_KEY = CONFIG.OPENAI_API_KEY
 MODEL = CONFIG.OPENAI_VISION_MODEL
 MAX_TOKENS = CONFIG.VISION_MAX_TOKENS
 
@@ -77,6 +77,7 @@ class Vision:
 
 
 if __name__ == "__main__":
+    image_path = "image.png"
     vision = Vision()
-    rsp = vision.generate_web_pages(image_path="./img.png")
+    rsp = vision.generate_web_pages(image_path=image_path)
     print(rsp)