model server build (#127)

* First commit to make model_server independent of Docker * Change the docker-compose file for archgw to set DNS_V4, plus minor build fixes * Additional fixes to separate the model server out in the build * Additional fixes to separate the model server out in the build * Fix to build model_server as a separate Python process. TODO: fix the embeddings logs after the CLI completes * Fix init to pull the tempfile using Python's tempfile package --------- Co-authored-by: Salman Paracha <salmanparacha@MacBook-Pro-261.local>
2026-05-15 11:02:39 +02:00 · 2024-10-06 18:21:43 -07:00 · 2024-10-06 18:21:43 -07:00 · b60ceb9168
commit b60ceb9168
parent 7d21359f5b
21 changed files with 3390 additions and 154 deletions
--- a/model_server/app/utils.py
+++ b/model_server/app/utils.py
@ -2,6 +2,14 @@ import numpy as np
 from concurrent.futures import ThreadPoolExecutor
 import time
 import torch
+import pkg_resources
+import yaml
+
+def load_yaml_config(file_name):
+    # Load the YAML file from the package
+    yaml_path = pkg_resources.resource_filename('app', file_name)
+    with open(yaml_path, 'r') as yaml_file:
+        return yaml.safe_load(yaml_file)


 def split_text_into_chunks(text, max_words=300):
@ -21,7 +29,6 @@ def split_text_into_chunks(text, max_words=300):
 def softmax(x):
     """Return the softmax of ``x`` computed along axis 0.

     The axis-0 maximum is subtracted before exponentiating. This leaves the
     result mathematically unchanged but keeps ``np.exp`` from overflowing to
     ``inf`` (and the quotient from turning into ``nan``) on large inputs.

     Args:
         x: Array-like of scores; normalisation runs over the first axis.

     Returns:
         An array of the same shape as ``x`` whose entries sum to 1 along
         axis 0.
     """
     x = np.asarray(x)
     if x.size == 0:
         # A max over an empty axis would raise; keep the plain formula here.
         return np.exp(x) / np.exp(x).sum(axis=0)
     # Shift by the maximum so the largest exponent is exp(0) == 1.
     exps = np.exp(x - x.max(axis=0))
     return exps / exps.sum(axis=0)

-
 class PredictionHandler:
    def __init__(self, model, tokenizer, device, task="toxic", hardware_config="cpu"):
        self.model = model