2024-10-09 11:42:05 -07:00
|
|
|
/// Name of the embedding model used by default.
// NOTE(review): the "katanemo/..." form looks like a model-hub repository id;
// the consumer is not visible in this file — confirm.
pub const DEFAULT_EMBEDDING_MODEL: &str = "katanemo/bge-large-en-v1.5";
|
2024-10-09 19:10:08 -07:00
|
|
|
/// Name of the intent model used by default.
// NOTE(review): the "katanemo/..." form looks like a model-hub repository id;
// the consumer is not visible in this file — confirm.
pub const DEFAULT_INTENT_MODEL: &str = "katanemo/bart-large-mnli";
|
2024-09-16 19:20:07 -07:00
|
|
|
/// Default prompt-target threshold (0.8).
// NOTE(review): presumably a score cutoff in [0, 1]; the comparison direction
// is decided at the use site, which is not visible here — confirm.
pub const DEFAULT_PROMPT_TARGET_THRESHOLD: f64 = 0.8;
|
2024-10-15 11:43:05 -07:00
|
|
|
/// Default hallucination threshold (0.25).
// NOTE(review): presumably a score cutoff in [0, 1]; the comparison direction
// is decided at the use site, which is not visible here — confirm.
pub const DEFAULT_HALLUCINATED_THRESHOLD: f64 = 0.25;
|
2024-09-27 16:41:39 -07:00
|
|
|
/// Header key string for the rate-limit selector.
// NOTE(review): presumably read from incoming request headers to pick a
// rate-limit bucket — confirm against the caller.
pub const RATELIMIT_SELECTOR_HEADER_KEY: &str = "x-arch-ratelimit-selector";
|
2024-07-30 16:23:23 -07:00
|
|
|
/// Role string `"system"`.
// NOTE(review): presumably the `role` value of system messages in chat
// requests — confirm against the message-building code.
pub const SYSTEM_ROLE: &str = "system";
|
|
|
|
|
/// Role string `"user"`.
// NOTE(review): presumably the `role` value of user messages in chat
// requests — confirm against the message-building code.
pub const USER_ROLE: &str = "user";
|
2024-09-10 14:24:46 -07:00
|
|
|
/// Model name string `"gpt-3.5-turbo"`.
// NOTE(review): where this name is sent (request body, routing) is not
// visible in this file — confirm.
pub const GPT_35_TURBO: &str = "gpt-3.5-turbo";
|
2024-09-27 16:41:39 -07:00
|
|
|
/// Cluster name string `"arch_fc"`.
// NOTE(review): the identifier is spelled `ARC_` while the value and the
// sibling constants (`ARCH_FC_REQUEST_TIMEOUT_MS`, `ARCH_FC_MODEL_NAME`) use
// `ARCH`. Likely a typo, but renaming would break existing callers — confirm
// before changing.
pub const ARC_FC_CLUSTER: &str = "arch_fc";
|
|
|
|
|
/// Request timeout in milliseconds: 2 minutes x 60 s x 1000 ms = 120000.
pub const ARCH_FC_REQUEST_TIMEOUT_MS: u64 = 2 * 60 * 1_000;
|
2024-10-01 11:24:43 -07:00
|
|
|
/// Name string `"model_server"`.
// NOTE(review): presumably the cluster/upstream name used to reach the model
// server — confirm against the dispatch code.
pub const MODEL_SERVER_NAME: &str = "model_server";
|
2024-09-27 16:41:39 -07:00
|
|
|
/// Header name string `"x-arch-llm-provider"`.
// NOTE(review): per the constant's name this is the routing header, presumably
// carrying the selected LLM provider — confirm who sets and who reads it.
pub const ARCH_ROUTING_HEADER: &str = "x-arch-llm-provider";
|
2024-10-01 09:14:01 -07:00
|
|
|
/// Key string `"arch_messages"`.
// NOTE(review): the container this key indexes (metadata map, JSON body, ...)
// is not visible in this file — confirm.
pub const ARCH_MESSAGES_KEY: &str = "arch_messages";
|
2024-10-03 10:57:01 -07:00
|
|
|
/// Header name string `"x-arch-llm-provider-hint"`.
// NOTE(review): presumably a caller-supplied hint for LLM provider selection;
// how it interacts with `ARCH_ROUTING_HEADER` is not visible here — confirm.
pub const ARCH_PROVIDER_HINT_HEADER: &str = "x-arch-llm-provider-hint";
|
2024-10-18 12:53:44 -07:00
|
|
|
/// URL path string `"/v1/chat/completions"`.
// NOTE(review): looks like the OpenAI-style chat completions route; whether it
// is matched on incoming requests or used for outgoing ones is not visible
// here — confirm.
pub const CHAT_COMPLETIONS_PATH: &str = "/v1/chat/completions";
|
2024-10-07 00:03:25 -07:00
|
|
|
/// Header name string `"x-arch-state"`.
// NOTE(review): the format and lifetime of the state carried in this header
// are not visible in this file — confirm.
pub const ARCH_STATE_HEADER: &str = "x-arch-state";
|
2024-10-07 18:38:55 -07:00
|
|
|
/// Model name string `"Arch-Function-1.5B"`.
// NOTE(review): presumably the model requested from the `arch_fc` cluster —
// confirm against the request-building code.
pub const ARCH_FC_MODEL_NAME: &str = "Arch-Function-1.5B";
|
2024-10-08 16:24:08 -07:00
|
|
|
/// Header name string `"x-request-id"`.
// NOTE(review): presumably used to correlate a request across hops — confirm
// whether it is generated here or only propagated.
pub const REQUEST_ID_HEADER: &str = "x-request-id";
|
|
|
|
|
/// Cluster name string `"arch_internal"`.
// NOTE(review): what is served behind this cluster is not visible in this
// file — confirm against the proxy configuration.
pub const ARCH_INTERNAL_CLUSTER_NAME: &str = "arch_internal";
|
|
|
|
|
/// Header name string `"x-arch-upstream"`.
// NOTE(review): per the constant's name this carries the upstream host;
// who sets and who consumes it is not visible here — confirm.
pub const ARCH_UPSTREAM_HOST_HEADER: &str = "x-arch-upstream";
|
2024-10-09 15:47:32 -07:00
|
|
|
/// Listener name string `"arch_llm_listener"`.
// NOTE(review): presumably must match a listener name in the proxy
// configuration — confirm.
pub const ARCH_LLM_UPSTREAM_LISTENER: &str = "arch_llm_listener";
|
2024-10-15 11:43:05 -07:00
|
|
|
/// Prefix string `"Arch"`.
// NOTE(review): presumably compared against the start of a model name to
// recognise Arch models (e.g. `ARCH_FC_MODEL_NAME` begins with it) — confirm
// at the use site.
pub const ARCH_MODEL_PREFIX: &str = "Arch";
|