From 712dfb23b257e738905a20932531498e177b3194 Mon Sep 17 00:00:00 2001 From: usamimeri_renko <1710269958@qq.com> Date: Tue, 21 May 2024 13:13:10 +0800 Subject: [PATCH 1/2] update qwen --- metagpt/utils/token_counter.py | 14 +++++++++----- 1 file changed, 9 insertions(+), 5 deletions(-) diff --git a/metagpt/utils/token_counter.py b/metagpt/utils/token_counter.py index a8652e607..e23cf5682 100644 --- a/metagpt/utils/token_counter.py +++ b/metagpt/utils/token_counter.py @@ -128,11 +128,15 @@ DashScope Token price https://help.aliyun.com/zh/dashscope/developer-reference/t Different model has different detail page. Attention, some model are free for a limited time. """ DASHSCOPE_TOKEN_COSTS = { - "qwen-turbo": {"prompt": 0.0011, "completion": 0.0011}, - "qwen-plus": {"prompt": 0.0028, "completion": 0.0028}, - "qwen-max": {"prompt": 0.0, "completion": 0.0}, - "qwen-max-1201": {"prompt": 0.0, "completion": 0.0}, - "qwen-max-longcontext": {"prompt": 0.0, "completion": 0.0}, + "qwen-turbo": {"prompt": 0.00028, "completion": 0.00083}, + "qwen-long": {"prompt": 0.00007, "completion": 0.00028}, + "qwen-plus": {"prompt": 0.00055, "completion": 0.00166}, + "qwen-max": {"prompt": 0.0055, "completion": 0.0166}, + "qwen-max-0428": {"prompt": 0.0055, "completion": 0.0166}, + "qwen-max-0403": {"prompt": 0.0055, "completion": 0.0166}, + "qwen-max-0107": {"prompt": 0.0055, "completion": 0.0166}, + "qwen-max-1201": {"prompt": 0.0166, "completion": 0.0166}, + "qwen-max-longcontext": {"prompt": 0.0055, "completion": 0.0166}, "llama2-7b-chat-v2": {"prompt": 0.0, "completion": 0.0}, "llama2-13b-chat-v2": {"prompt": 0.0, "completion": 0.0}, "qwen-72b-chat": {"prompt": 0.0, "completion": 0.0}, From 4797c9116804442c672f4b10bee528276458eb69 Mon Sep 17 00:00:00 2001 From: usamimeri_renko <93753250+usamimeri@users.noreply.github.com> Date: Thu, 20 Jun 2024 16:33:54 +0800 Subject: [PATCH 2/2] Update latest qwen price and max token --- metagpt/utils/token_counter.py | 34 
+++++++++++++++++++++++++++++++++- 1 file changed, 33 insertions(+), 1 deletion(-) diff --git a/metagpt/utils/token_counter.py b/metagpt/utils/token_counter.py index 43f04cfef..b3391a7e2 100644 --- a/metagpt/utils/token_counter.py +++ b/metagpt/utils/token_counter.py @@ -137,6 +137,18 @@ DashScope Token price https://help.aliyun.com/zh/dashscope/developer-reference/t Different model has different detail page. Attention, some model are free for a limited time. """ DASHSCOPE_TOKEN_COSTS = { + "qwen2-72b-instruct": {"prompt": 0.000714, "completion": 0.001428}, + "qwen2-57b-a14b-instruct": {"prompt": 0.0005, "completion": 0.001}, + "qwen2-7b-instruct": {"prompt": 0.000143, "completion": 0.000286}, + "qwen2-1.5b-instruct": {"prompt": 0, "completion": 0}, + "qwen2-0.5b-instruct": {"prompt": 0, "completion": 0}, + "qwen1.5-110b-chat": {"prompt": 0.001, "completion": 0.002}, + "qwen1.5-72b-chat": {"prompt": 0.000714, "completion": 0.001428}, + "qwen1.5-32b-chat": {"prompt": 0.0005, "completion": 0.001}, + "qwen1.5-14b-chat": {"prompt": 0.000286, "completion": 0.000571}, + "qwen1.5-7b-chat": {"prompt": 0.000143, "completion": 0.000286}, + "qwen1.5-1.8b-chat": {"prompt": 0, "completion": 0}, + "qwen1.5-0.5b-chat": {"prompt": 0, "completion": 0}, "qwen-turbo": {"prompt": 0.00028, "completion": 0.00083}, "qwen-long": {"prompt": 0.00007, "completion": 0.00028}, "qwen-plus": {"prompt": 0.00055, "completion": 0.00166}, @@ -148,7 +160,7 @@ DASHSCOPE_TOKEN_COSTS = { "qwen-max-longcontext": {"prompt": 0.0055, "completion": 0.0166}, "llama2-7b-chat-v2": {"prompt": 0.0, "completion": 0.0}, "llama2-13b-chat-v2": {"prompt": 0.0, "completion": 0.0}, - "qwen-72b-chat": {"prompt": 0.0, "completion": 0.0}, + "qwen-72b-chat": {"prompt": 0.0028, "completion": 0.0028}, "qwen-14b-chat": {"prompt": 0.0011, "completion": 0.0011}, "qwen-7b-chat": {"prompt": 0.00084, "completion": 0.00084}, "qwen-1.8b-chat": {"prompt": 0.0, "completion": 0.0}, @@ -228,6 +240,26 @@ TOKEN_MAX = { 
"doubao-pro-4k-240515": 4000, "doubao-pro-32k-240515": 32000, "doubao-pro-128k-240515": 128000, + # Qwen max tokens, see https://help.aliyun.com/zh/dashscope/developer-reference/tongyi-qianwen-7b-14b-72b-api-detailes + "qwen2-57b-a14b-instruct": 32768, + "qwen2-72b-instruct": 131072, + "qwen2-7b-instruct": 32768, + "qwen2-1.5b-instruct": 32768, + "qwen2-0.5b-instruct": 32768, + "qwen1.5-110b-chat": 32000, + "qwen1.5-72b-chat": 32000, + "qwen1.5-32b-chat": 32000, + "qwen1.5-14b-chat": 8000, + "qwen1.5-7b-chat": 32000, + "qwen1.5-1.8b-chat": 32000, + "qwen1.5-0.5b-chat": 32000, + "codeqwen1.5-7b-chat": 64000, + "qwen-72b-chat": 32000, + "qwen-14b-chat": 8000, + "qwen-7b-chat": 32000, + "qwen-1.8b-longcontext-chat": 32000, + "qwen-1.8b-chat": 8000, + } # For Amazon Bedrock US region