Refactor model server hardware config + add unit tests to load/request to the server (#189)

* remove mode/hardware * add test and pre commit hook * add pytest dependencies * fix format * fix lint * fix precommit * fix pre commit * fix pre commit * fix precommit * fix precommit * fix precommit * fix precommit * fix precommit * fix precommit * fix precommit * fix precommit * fix precommit * fix precommit
2026-06-20 15:28:07 +02:00 · 2024-10-16 16:58:10 -07:00 · 2024-10-16 16:58:10 -07:00 · 8e54ac20d8
commit 8e54ac20d8
parent 3bd2ffe9fb
13 changed files with 480 additions and 43 deletions
--- a/model_server/app/main.py
+++ b/model_server/app/main.py
@@ -13,6 +13,7 @@ from app.commons.constants import embedding_model, zero_shot_model, arch_guard_h
 from app.function_calling.model_utils import (
    chat_completion as arch_function_chat_completion,
 )
+from unittest.mock import patch

 logger = utils.get_model_server_logger()

@@ -173,6 +174,7 @@ async def zeroshot(req: ZeroShotRequest, res: Response):


@app.post("/hallucination")
+@patch("app.loader.glb.DEVICE", "cpu")  # Mock the device to 'cpu'
 async def hallucination(req: HallucinationRequest, res: Response):
    """
    Take input as text and return the prediction of hallucination for each parameter