plano/model_server/app/__init__.py
Salman Paracha b60ceb9168
model server build (#127)
* first commit to have model_server not be dependent on Docker

* making changes to fix the docker-compose file for archgw to set DNS_V4 and minor fixes with the build

* additional fixes for model server to be separated out in the build

* additional fixes for model server to be separated out in the build

* fix to get model_server to be built as a separate python process. TODO: fix the embeddings logs after cli completes

* fixing init to pull tempfile using the tempfile python package

---------

Co-authored-by: Salman Paracha <salmanparacha@MacBook-Pro-261.local>
2024-10-06 18:21:43 -07:00

99 lines
3 KiB
Python

import sys
import subprocess
import os
import signal
import time
import requests
import psutil
import tempfile
# Path to the file where the server process ID will be stored
PID_FILE = os.path.join(tempfile.gettempdir(), "model_server.pid")
def run_server():
"""Start, stop, or restart the Uvicorn server based on command-line arguments."""
if len(sys.argv) > 1:
action = sys.argv[1]
else:
action = "start"
if action == "start":
start_server()
elif action == "stop":
stop_server()
elif action == "restart":
restart_server()
else:
print(f"Unknown action: {action}")
sys.exit(1)
def start_server():
"""Start the Uvicorn server and save the process ID."""
if os.path.exists(PID_FILE):
print("Server is already running. Use 'model_server restart' to restart it.")
sys.exit(1)
print(f"Starting Archgw Model Server")
process = subprocess.Popen(
["uvicorn", "app.main:app", "--host", "0.0.0.0", "--port", "51000"],
)
if wait_for_health_check("http://0.0.0.0:51000/healthz"):
# Write the process ID to the PID file
with open(PID_FILE, "w") as f:
f.write(str(process.pid))
print(f"ARCH GW Model Server started with PID {process.pid}")
else:
#Add model_server boot-up logs
print(f"ARCH GW Model Server - Didn't Sart In Time. Shutting Down")
process.terminate()
def wait_for_health_check(url, timeout=180):
"""Wait for the Uvicorn server to respond to health-check requests."""
start_time = time.time()
while time.time() - start_time < timeout:
try:
response = requests.get(url)
if response.status_code == 200:
return True
except requests.ConnectionError:
time.sleep(1)
print("Timed out waiting for ARCH GW Model Server to respond.")
return False
def stop_server():
"""Stop the running Uvicorn server."""
if not os.path.exists(PID_FILE):
print("Status: Archgw Model Server not running")
return
# Read the process ID from the PID file
with open(PID_FILE, "r") as f:
pid = int(f.read())
try:
# Get process by PID
process = psutil.Process(pid)
# Gracefully terminate the process
process.terminate() # Sends SIGTERM by default
process.wait(timeout=10) # Wait for up to 10 seconds for the process to exit
print(f"Server with PID {pid} stopped.")
os.remove(PID_FILE)
except psutil.NoSuchProcess:
print(f"Process with PID {pid} not found. Cleaning up PID file.")
os.remove(PID_FILE)
except psutil.TimeoutExpired:
print(f"Process with PID {pid} did not terminate in time. Forcing shutdown.")
process.kill() # Forcefully kill the process
os.remove(PID_FILE)
def restart_server():
"""Restart the Uvicorn server."""
print("Check: Is Archgw Model Server running?")
stop_server()
start_server()