remove nli model

This commit is contained in:
Adil Hafeez 2024-12-10 21:03:02 -08:00
parent 3e4b04099c
commit 5bf9a80283
4 changed files with 2 additions and 4 deletions

View file

@ -2,7 +2,6 @@ KATANEMO_DOCKERHUB_REPO = "katanemo/archgw"
KATANEMO_LOCAL_MODEL_LIST = [
"katanemo/Arch-Guard-cpu",
"katanemo/Arch-Guard",
"katanemo/bge-large-en-v1.5",
]
SERVICE_NAME_ARCHGW = "archgw"
SERVICE_NAME_MODEL_SERVER = "model_server"

View file

@ -1,4 +1,3 @@
pub const DEFAULT_EMBEDDING_MODEL: &str = "katanemo/bge-large-en-v1.5";
pub const DEFAULT_INTENT_MODEL: &str = "katanemo/bart-large-mnli";
pub const DEFAULT_PROMPT_TARGET_THRESHOLD: f64 = 0.8;
pub const DEFAULT_HALLUCINATED_THRESHOLD: f64 = 0.25;

View file

@ -15,7 +15,7 @@ WORKDIR /src
# specify list of models that will go into the image as a comma separated list
# following models have been tested to work with this image
# "sentence-transformers/all-MiniLM-L6-v2,sentence-transformers/all-mpnet-base-v2,thenlper/gte-base,thenlper/gte-large,thenlper/gte-small"
ENV MODELS="katanemo/bge-large-en-v1.5-onnx"
ENV MODELS=""
COPY ./app ./app
COPY ./app/guard_model_config.yaml .

View file

@ -45,7 +45,7 @@ RUN if command -v nvcc >/dev/null 2>&1; then \
COPY . /src
# Specify list of models that will go into the image as a comma separated list
ENV MODELS="katanemo/bge-large-en-v1.5-onnx"
ENV MODELS=""
ENV DEBIAN_FRONTEND=noninteractive
COPY /app /app