Add files via upload
Increasing timeout for heavy load situatuions
This commit is contained in:
parent
295ace0401
commit
64549b4e1c
1 changed files with 4 additions and 4 deletions
|
|
@ -71,7 +71,7 @@ async def fetch_available_models(endpoint: str) -> Set[str]:
|
|||
set is returned.
|
||||
"""
|
||||
try:
|
||||
async with httpx.AsyncClient(timeout=1.0) as client:
|
||||
async with httpx.AsyncClient(timeout=5.0) as client:
|
||||
if "/v1" in endpoint:
|
||||
resp = await client.get(f"{endpoint}/models")
|
||||
else:
|
||||
|
|
@ -118,12 +118,12 @@ async def fetch_endpoint_details(endpoint: str, route: str, detail: str) -> List
|
|||
resp = await client.get(f"{endpoint}{route}")
|
||||
resp.raise_for_status()
|
||||
data = resp.json()
|
||||
detail = data.get(detail)
|
||||
detail = data.get(detail, [])
|
||||
return detail
|
||||
except Exception as e:
|
||||
# If anything goes wrong we cannot reply details
|
||||
print(e)
|
||||
return {detail: ["N/A"]}
|
||||
return {detail: []}
|
||||
|
||||
def ep2base(ep):
|
||||
if "/v1" in ep:
|
||||
|
|
@ -795,7 +795,7 @@ async def ps_proxy(request: Request):
|
|||
for modellist in loaded_models:
|
||||
models['models'] += modellist
|
||||
|
||||
# 25. Return a JSONResponse with deduplicated currently deployed models
|
||||
# 2. Return a JSONResponse with deduplicated currently deployed models
|
||||
return JSONResponse(
|
||||
content={"models": dedupe_on_keys(models['models'], ['digest'])},
|
||||
status_code=200,
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue