Some fixes on model server (#362)

* Some fixes on model server

* Remove prompt_prefilling message

* Fix logging

* Fix poetry issues

* Improve logging and update the support for text truncation

* Fix tests

* Fix tests

* Fix tests

* Fix modelserver tests

* Update modelserver tests
This commit is contained in:
Shuguang Chen 2025-01-10 16:45:36 -08:00 committed by GitHub
parent ebda682b30
commit 88a02dc478
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
25 changed files with 1090 additions and 1666 deletions

View file

@@ -1,6 +1,6 @@
[tool.poetry]
name = "archgw_modelserver"
version = "0.1.7"
version = "0.1.8"
description = "A model server for serving models"
authors = ["Katanemo Labs, Inc <info@katanemo.com>"]
license = "Apache 2.0"
@@ -10,17 +10,15 @@ packages = [
]
[tool.poetry.dependencies]
python = "^3.12"
python = "^3.10"
fastapi = "0.115.0"
torch = "2.4.1"
uvicorn = "0.31.0"
transformers = "*"
pyyaml = "6.0.2"
accelerate = "*"
psutil = "6.0.0"
pandas = "*"
transformers = "^4.37.0"
accelerate = "^1.0.0"
pydantic = "^2.10.1"
dateparser = "*"
openai = "1.50.2"
openai = "^1.50.2"
httpx = "0.27.2" # https://community.openai.com/t/typeerror-asyncclient-init-got-an-unexpected-keyword-argument-proxies/1040287
pytest-asyncio = "*"
pytest = "*"
@@ -33,7 +31,7 @@ pytest-retry = "^1.6.3"
pytest-httpserver = "^1.1.0"
[tool.poetry.scripts]
archgw_modelserver = "src.cli:run_server"
archgw_modelserver = "src.cli:main"
[build-system]
requires = ["poetry-core>=1.0.0"]