mirror of
https://github.com/katanemo/plano.git
synced 2026-04-30 03:16:28 +02:00
Some fixes on model server (#362)
* Some fixes on model server
* Remove prompt_prefilling message
* Fix logging
* Fix poetry issues
* Improve logging and update the support for text truncation
* Fix tests
* Fix tests
* Fix tests
* Fix modelserver tests
* Update modelserver tests
This commit is contained in:
parent
ebda682b30
commit
88a02dc478
25 changed files with 1090 additions and 1666 deletions
|
|
@ -1,6 +1,6 @@
|
|||
[tool.poetry]
|
||||
name = "archgw_modelserver"
|
||||
version = "0.1.7"
|
||||
version = "0.1.8"
|
||||
description = "A model server for serving models"
|
||||
authors = ["Katanemo Labs, Inc <info@katanemo.com>"]
|
||||
license = "Apache 2.0"
|
||||
|
|
@ -10,17 +10,15 @@ packages = [
|
|||
]
|
||||
|
||||
[tool.poetry.dependencies]
|
||||
python = "^3.12"
|
||||
python = "^3.10"
|
||||
fastapi = "0.115.0"
|
||||
torch = "2.4.1"
|
||||
uvicorn = "0.31.0"
|
||||
transformers = "*"
|
||||
pyyaml = "6.0.2"
|
||||
accelerate = "*"
|
||||
psutil = "6.0.0"
|
||||
pandas = "*"
|
||||
transformers = "^4.37.0"
|
||||
accelerate = "^1.0.0"
|
||||
pydantic = "^2.10.1"
|
||||
dateparser = "*"
|
||||
openai = "1.50.2"
|
||||
openai = "^1.50.2"
|
||||
httpx = "0.27.2" # https://community.openai.com/t/typeerror-asyncclient-init-got-an-unexpected-keyword-argument-proxies/1040287
|
||||
pytest-asyncio = "*"
|
||||
pytest = "*"
|
||||
|
|
@ -33,7 +31,7 @@ pytest-retry = "^1.6.3"
|
|||
pytest-httpserver = "^1.1.0"
|
||||
|
||||
[tool.poetry.scripts]
|
||||
archgw_modelserver = "src.cli:run_server"
|
||||
archgw_modelserver = "src.cli:main"
|
||||
|
||||
[build-system]
|
||||
requires = ["poetry-core>=1.0.0"]
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue