mirror of
https://github.com/katanemo/plano.git
synced 2026-06-14 15:15:15 +02:00
model server build (#127)
* first commit to have model_server not be dependent on Docker * making changes to fix the docker-compose file for archgw to set DNS_V4 and minor fixes with the build * additional fixes for model server to be separated out in the build * additional fixes for model server to be separated out in the build * fix to get model_server to be built as a separate python process. TODO: fix the embeddings logs after cli completes * fixing init to pull tempfile using the tempfile python package --------- Co-authored-by: Salman Paracha <salmanparacha@MacBook-Pro-261.local>
This commit is contained in:
parent
7d21359f5b
commit
b60ceb9168
21 changed files with 3390 additions and 154 deletions
37
model_server/pyproject.toml
Normal file
37
model_server/pyproject.toml
Normal file
|
|
@ -0,0 +1,37 @@
|
|||
[tool.poetry]
|
||||
name = "archgw_modelserver"
|
||||
version = "0.1.0"
|
||||
description = "A model server for serving models"
|
||||
authors = ["Katanemo Labs, Inc <archgw@katanemo.com>"]
|
||||
# SPDX license identifier (hyphenated form), the notation Poetry recommends for this field.
license = "Apache-2.0"
|
||||
readme = "README.md"
|
||||
packages = [
|
||||
{ include = "app" }, # Include the 'app' package
|
||||
{ include = "app/arch_fc" }, # Include the 'app/arch_fc' sub-package
|
||||
]
|
||||
include = ["app/*.yaml"]
|
||||
|
||||
[tool.poetry.dependencies]
|
||||
python = ">=3.10"
|
||||
fastapi = "0.115.0"
|
||||
sentence-transformers = "3.1.1"
|
||||
torch = "2.4.1"
|
||||
uvicorn = "0.31.0"
|
||||
transformers = "*"
|
||||
pyyaml = "6.0.2"
|
||||
accelerate = "*"
|
||||
psutil = "6.0.0"
|
||||
optimum-intel = "*"
|
||||
openvino = "*"
|
||||
pandas = "*"
|
||||
dateparser = "*"
|
||||
openai = "1.50.2"
|
||||
tf-keras = "*"
|
||||
onnx = "*"
|
||||
|
||||
[tool.poetry.scripts]
|
||||
archgw_modelserver = "app:run_server"
|
||||
|
||||
[build-system]
|
||||
requires = ["poetry-core>=1.0.0"]
|
||||
build-backend = "poetry.core.masonry.api"
|
||||
Loading…
Add table
Add a link
Reference in a new issue