Merge branch 'main' into adil/tmobile_work

2026-06-17 15:25:17 +02:00 · 2025-09-10 10:47:33 -07:00 · 2025-09-10 10:47:33 -07:00 · 5df01d73f0
commit 5df01d73f0
parent c3a0874829 fb0581fd39
38 changed files with 2842 additions and 919 deletions
--- a/crates/common/src/configuration.rs
+++ b/crates/common/src/configuration.rs
@@ -181,8 +181,8 @@ pub struct EmbeddingProviver {
 pub enum LlmProviderType {
    #[serde(rename = "arch")]
    Arch,
-    #[serde(rename = "claude")]
-    Claude,
+    #[serde(rename = "anthropic")]
+    Anthropic,
    #[serde(rename = "deepseek")]
    Deepseek,
    #[serde(rename = "groq")]
@@ -199,7 +199,7 @@ impl Display for LlmProviderType {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        match self {
            LlmProviderType::Arch => write!(f, "arch"),
-            LlmProviderType::Claude => write!(f, "claude"),
+            LlmProviderType::Anthropic => write!(f, "anthropic"),
            LlmProviderType::Deepseek => write!(f, "deepseek"),
            LlmProviderType::Groq => write!(f, "groq"),
            LlmProviderType::Gemini => write!(f, "gemini"),
--- a/crates/common/src/consts.rs
+++ b/crates/common/src/consts.rs
@@ -12,6 +12,7 @@ pub const ARCH_ROUTING_HEADER: &str = "x-arch-llm-provider";
 pub const MESSAGES_KEY: &str = "messages";
 pub const ARCH_PROVIDER_HINT_HEADER: &str = "x-arch-llm-provider-hint";
 pub const CHAT_COMPLETIONS_PATH: &str = "/v1/chat/completions";
+pub const MESSAGES_PATH: &str = "/v1/messages";
 pub const HEALTHZ_PATH: &str = "/healthz";
 pub const X_ARCH_STATE_HEADER: &str = "x-arch-state";
 pub const X_ARCH_API_RESPONSE: &str = "x-arch-api-response-message";
--- a/crates/common/src/routing.rs
+++ b/crates/common/src/routing.rs
@@ -33,6 +33,7 @@ pub fn get_llm_provider(
        return provider;
    }

+
    if llm_providers.default().is_some() {
        return llm_providers.default().unwrap();
    }
--- a/crates/common/src/tokenizer.rs
+++ b/crates/common/src/tokenizer.rs
@@ -2,7 +2,7 @@ use log::debug;

 #[allow(dead_code)]
 pub fn token_count(model_name: &str, text: &str) -> Result<usize, String> {
-    debug!("getting token count model={}", model_name);
+    debug!("TOKENIZER: computing token count for model={}", model_name);
    //HACK: add support for tokenizing mistral and other models
    //filed issue https://github.com/katanemo/arch/issues/222