release 0.3.2 (#507)

2026-07-23 16:51:04 +02:00 · 2025-06-13 17:02:20 -07:00 · 2025-06-13 17:02:20 -07:00 · 7baec20772
commit 7baec20772
parent 0d6e06dfec
20 changed files with 153 additions and 132 deletions
--- a/crates/common/src/tokenizer.rs
+++ b/crates/common/src/tokenizer.rs
@ -6,15 +6,21 @@ pub fn token_count(model_name: &str, text: &str) -> Result<usize, String> {
    //HACK: add support for tokenizing mistral and other models
    //filed issue https://github.com/katanemo/arch/issues/222

-    let updated_model = match model_name.starts_with("gpt") {
+    let updated_model = match model_name.starts_with("gpt-4") {
        false => {
            debug!(
                "tiktoken_rs: unsupported model: {}, using gpt-4 to compute token count",
                model_name
            );
-            "gpt-4"
+            "gpt-4o"
+        }
+        true => {
+            if model_name.starts_with("gpt-4.1") {
+                "gpt-4o"
+            } else {
+                model_name
+            }
        }
-        true => model_name,
    };

    // Consideration: is it more expensive to instantiate the BPE object every time, or to contend the singleton?