feat: +runtime multi-llm support

This commit is contained in:
莘权 马 2024-07-01 20:23:44 +08:00
parent 9f8f0a27fd
commit 5b15584480
9 changed files with 210 additions and 7 deletions

View file

@@ -259,7 +259,6 @@ TOKEN_MAX = {
"qwen-7b-chat": 32000,
"qwen-1.8b-longcontext-chat": 32000,
"qwen-1.8b-chat": 8000,
}
# For Amazon Bedrock US region