Merge pull request #1288 from usamimeri/huoshan

Feat: Add Ark support (For Doubao)
2026-04-28 02:23:52 +02:00 · 2024-05-29 16:21:51 +08:00 · 2024-05-29 16:21:51 +08:00 · a705a515fb
commit a705a515fb
parent 316a49a478 fbb307442c
7 changed files with 154 additions and 0 deletions
--- a/metagpt/provider/__init__.py
+++ b/metagpt/provider/__init__.py
@@ -18,6 +18,7 @@ from metagpt.provider.qianfan_api import QianFanLLM
 from metagpt.provider.dashscope_api import DashScopeLLM
 from metagpt.provider.anthropic_api import AnthropicLLM
 from metagpt.provider.bedrock_api import BedrockLLM
+from metagpt.provider.ark_api import ArkLLM

 __all__ = [
    "GeminiLLM",
@@ -32,4 +33,5 @@ __all__ = [
    "DashScopeLLM",
    "AnthropicLLM",
    "BedrockLLM",
+    "ArkLLM",
 ]
--- a/metagpt/provider/ark_api.py
+++ b/metagpt/provider/ark_api.py
@@ -0,0 +1,44 @@
+from openai import AsyncStream
+from openai.types import CompletionUsage
+from openai.types.chat import ChatCompletion, ChatCompletionChunk
+
+from metagpt.configs.llm_config import LLMType
+from metagpt.const import USE_CONFIG_TIMEOUT
+from metagpt.logs import log_llm_stream
+from metagpt.provider.llm_provider_registry import register_provider
+from metagpt.provider.openai_api import OpenAILLM
+
+
+@register_provider(LLMType.ARK)
+class ArkLLM(OpenAILLM):
+    """LLM provider for the Volcano Engine Ark API.
+
+    See: https://www.volcengine.com/docs/82379/1263482
+    """
+
+    async def _achat_completion_stream(self, messages: list[dict], timeout=USE_CONFIG_TIMEOUT) -> str:
+        """Stream a chat completion and return the concatenated reply text.
+
+        Every content delta is forwarded to ``log_llm_stream`` as it arrives.
+        After the stream ends, ``self._update_costs`` is called once with the
+        usage reported by the stream (if any) and the model name of the last
+        chunk received.
+
+        Args:
+            messages: Chat messages, passed through ``self._cons_kwargs``.
+            timeout: Request timeout, resolved through ``self.get_timeout``.
+
+        Returns:
+            The full reply assembled from all streamed content deltas; an
+            empty string when the stream produced no content.
+        """
+        response: AsyncStream[ChatCompletionChunk] = await self.aclient.chat.completions.create(
+            **self._cons_kwargs(messages, timeout=self.get_timeout(timeout)),
+            stream=True,
+            # Usage is only returned at the end of a stream when this option is set.
+            extra_body={"stream_options": {"include_usage": True}},
+        )
+        usage = None
+        last_chunk = None
+        collected_messages = []
+        async for chunk in response:
+            last_chunk = chunk
+            # A chunk whose ``choices`` is empty carries no text.
+            chunk_message = (chunk.choices[0].delta.content or "") if chunk.choices else ""
+            log_llm_stream(chunk_message)
+            collected_messages.append(chunk_message)
+            # Ark's streaming call returns usage in the last chunk, whose ``choices`` is [].
+            chunk_usage = getattr(chunk, "usage", None)
+            if chunk_usage:
+                # Accept both an already-parsed CompletionUsage and a plain mapping;
+                # ``**`` unpacking only works on the latter.
+                if isinstance(chunk_usage, CompletionUsage):
+                    usage = chunk_usage
+                else:
+                    usage = CompletionUsage(**chunk_usage)
+
+        log_llm_stream("\n")
+        full_reply_content = "".join(collected_messages)
+        # An empty stream yields no chunk, so there is no model name or usage to
+        # record; reading the loop variable here would raise UnboundLocalError.
+        if last_chunk is not None:
+            self._update_costs(usage, last_chunk.model)
+        return full_reply_content
+
+    async def _achat_completion(self, messages: list[dict], timeout=USE_CONFIG_TIMEOUT) -> ChatCompletion:
+        """Request a non-streaming chat completion and record its usage.
+
+        Args:
+            messages: Chat messages, passed through ``self._cons_kwargs``.
+            timeout: Request timeout, resolved through ``self.get_timeout``.
+
+        Returns:
+            The ``ChatCompletion`` response returned by the client.
+        """
+        kwargs = self._cons_kwargs(messages, timeout=self.get_timeout(timeout))
+        rsp: ChatCompletion = await self.aclient.chat.completions.create(**kwargs)
+        self._update_costs(rsp.usage, rsp.model)
+        return rsp