Add files via upload

Increasing timeout for heavy load situatuions
This commit is contained in:
Alpha Nerd 2025-09-01 09:01:41 +02:00 committed by GitHub
parent 295ace0401
commit 64549b4e1c
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@ -71,7 +71,7 @@ async def fetch_available_models(endpoint: str) -> Set[str]:
set is returned.
"""
try:
async with httpx.AsyncClient(timeout=1.0) as client:
async with httpx.AsyncClient(timeout=5.0) as client:
if "/v1" in endpoint:
resp = await client.get(f"{endpoint}/models")
else:
@ -118,12 +118,12 @@ async def fetch_endpoint_details(endpoint: str, route: str, detail: str) -> List
resp = await client.get(f"{endpoint}{route}")
resp.raise_for_status()
data = resp.json()
detail = data.get(detail)
detail = data.get(detail, [])
return detail
except Exception as e:
# If anything goes wrong we cannot reply details
print(e)
return {detail: ["N/A"]}
return {detail: []}
def ep2base(ep):
if "/v1" in ep:
@ -795,7 +795,7 @@ async def ps_proxy(request: Request):
for modellist in loaded_models:
models['models'] += modellist
# 25. Return a JSONResponse with deduplicated currently deployed models
# 2. Return a JSONResponse with deduplicated currently deployed models
return JSONResponse(
content={"models": dedupe_on_keys(models['models'], ['digest'])},
status_code=200,