release 0.3.2

2026-06-17 15:25:17 +02:00 · 2025-06-13 15:29:58 -07:00 · 2025-06-13 15:29:58 -07:00 · e3ddd92f03
commit e3ddd92f03
parent 0d6e06dfec
15 changed files with 30 additions and 24 deletions
--- a/.github/workflows/e2e_archgw.yml
+++ b/.github/workflows/e2e_archgw.yml
@ -24,7 +24,7 @@ jobs:

      - name: build arch docker image
        run: |
-          cd ../../ && docker build -f arch/Dockerfile . -t katanemo/archgw -t katanemo/archgw:0.3.1 -t katanemo/archgw:latest
+          cd ../../ && docker build -f arch/Dockerfile . -t katanemo/archgw -t katanemo/archgw:0.3.2 -t katanemo/archgw:latest

      - name: start archgw
        env:
--- a/.github/workflows/e2e_test_currency_convert.yml
+++ b/.github/workflows/e2e_test_currency_convert.yml
@ -24,7 +24,7 @@ jobs:

      - name: build arch docker image
        run: |
-          docker build  -f arch/Dockerfile . -t katanemo/archgw -t katanemo/archgw:0.3.1
+          docker build  -f arch/Dockerfile . -t katanemo/archgw -t katanemo/archgw:0.3.2

      - name: install poetry
        run: |
--- a/.github/workflows/e2e_test_preference_based_routing.yml
+++ b/.github/workflows/e2e_test_preference_based_routing.yml
@ -24,7 +24,7 @@ jobs:

      - name: build arch docker image
        run: |
-          docker build  -f arch/Dockerfile . -t katanemo/archgw -t katanemo/archgw:0.3.1
+          docker build  -f arch/Dockerfile . -t katanemo/archgw -t katanemo/archgw:0.3.2

      - name: install poetry
        run: |
--- a/.github/workflows/validate_arch_config.yml
+++ b/.github/workflows/validate_arch_config.yml
@ -24,7 +24,7 @@ jobs:

      - name: build arch docker image
        run: |
-          docker build  -f arch/Dockerfile . -t katanemo/archgw -t katanemo/archgw:0.3.1
+          docker build  -f arch/Dockerfile . -t katanemo/archgw -t katanemo/archgw:0.3.2

      - name: validate arch config
        run: |
--- a/README.md
+++ b/README.md
@ -81,7 +81,7 @@ Arch's CLI allows you to manage and interact with the Arch gateway efficiently.
 ```console
 $ python -m venv venv
 $ source venv/bin/activate   # On Windows, use: venv\Scripts\activate
-$ pip install archgw==0.3.1
+$ pip install archgw==0.3.2
 ```

 ### Build AI Agent with Arch Gateway
--- a/arch/tools/README.md
+++ b/arch/tools/README.md
@ -19,7 +19,7 @@ source venv/bin/activate

 ### Step 3: Run the build script
 ```bash
-pip install archgw==0.3.1
+pip install archgw==0.3.2
 ```

 ## Uninstall Instructions: archgw CLI
--- a/arch/tools/cli/consts.py
+++ b/arch/tools/cli/consts.py
@ -10,4 +10,4 @@ SERVICE_NAME_MODEL_SERVER = "model_server"
 SERVICE_ALL = "all"
 MODEL_SERVER_LOG_FILE = "~/archgw_logs/modelserver.log"
 ARCHGW_DOCKER_NAME = "archgw"
-ARCHGW_DOCKER_IMAGE = os.getenv("ARCHGW_DOCKER_IMAGE", "katanemo/archgw:0.3.1")
+ARCHGW_DOCKER_IMAGE = os.getenv("ARCHGW_DOCKER_IMAGE", "katanemo/archgw:0.3.2")
--- a/arch/tools/pyproject.toml
+++ b/arch/tools/pyproject.toml
@ -1,6 +1,6 @@
 [tool.poetry]
 name = "archgw"
-version = "0.3.1"
+version = "0.3.2"
 description = "Python-based CLI tool to manage Arch Gateway."
 authors = ["Katanemo Labs, Inc."]
 packages = [
@ -10,7 +10,7 @@ readme = "README.md"

 [tool.poetry.dependencies]
 python = "^3.10"
-archgw_modelserver = "^0.3.1"
+archgw_modelserver = "^0.3.2"
 click = "^8.1.7"
 jinja2 = "^3.1.4"
 jsonschema = "^4.23.0"
--- a/build_filter_image.sh
+++ b/build_filter_image.sh
@ -1 +1 @@
-docker build  -f arch/Dockerfile . -t katanemo/archgw -t katanemo/archgw:0.3.1
+docker build  -f arch/Dockerfile . -t katanemo/archgw -t katanemo/archgw:0.3.2
--- a/crates/common/src/tokenizer.rs
+++ b/crates/common/src/tokenizer.rs
@ -6,15 +6,21 @@ pub fn token_count(model_name: &str, text: &str) -> Result<usize, String> {
    //HACK: add support for tokenizing mistral and other models
    //filed issue https://github.com/katanemo/arch/issues/222

-    let updated_model = match model_name.starts_with("gpt") {
+    let updated_model = match model_name.starts_with("gpt-4") {
        false => {
            debug!(
                "tiktoken_rs: unsupported model: {}, using gpt-4 to compute token count",
                model_name
            );
-            "gpt-4"
+            "gpt-4o"
+        }
+        true => {
+            if model_name.starts_with("gpt-4.1") {
+                "gpt-4o"
+            } else {
+                model_name
+            }
        }
-        true => model_name,
    };

    // Consideration: is it more expensive to instantiate the BPE object every time, or to contend the singleton?
--- a/demos/use_cases/preference_based_routing/README.md
+++ b/demos/use_cases/preference_based_routing/README.md
@ -14,9 +14,9 @@ Make sure your machine is up to date with [latest version of archgw]([url](https
 2. start archgw in the foreground
 ```bash
 (venv) $ archgw up --service archgw --foreground
-2025-05-30 18:00:09,953 - cli.main - INFO - Starting archgw cli version: 0.3.1
+2025-05-30 18:00:09,953 - cli.main - INFO - Starting archgw cli version: 0.3.2
 2025-05-30 18:00:09,953 - cli.main - INFO - Validating /Users/adilhafeez/src/intelligent-prompt-gateway/demos/use_cases/preference_based_routing/arch_config.yaml
-2025-05-30 18:00:10,422 - cli.core - INFO - Starting arch gateway, image name: archgw, tag: katanemo/archgw:0.3.1
+2025-05-30 18:00:10,422 - cli.core - INFO - Starting arch gateway, image name: archgw, tag: katanemo/archgw:0.3.2
 2025-05-30 18:00:10,662 - cli.core - INFO - archgw status: running, health status: starting
 2025-05-30 18:00:11,712 - cli.core - INFO - archgw status: running, health status: starting
 2025-05-30 18:00:12,761 - cli.core - INFO - archgw is running and is healthy!
--- a/demos/use_cases/preference_based_routing/arch_config.yaml
+++ b/demos/use_cases/preference_based_routing/arch_config.yaml
@ -22,17 +22,17 @@ llm_providers:
    access_key: $OPENAI_API_KEY
    model: gpt-4o-mini

-  - name: gpt-4o
+  - name: gpt-4.1
    provider_interface: openai
    access_key: $OPENAI_API_KEY
-    model: gpt-4o
+    model: gpt-4.1
    default: true

  - name: code_generation
-    provider_interface: openai
-    access_key: $OPENAI_API_KEY
-    model: gpt-4o
-    usage: Generating new code snippets, functions, or boilerplate based on user prompts or requirements
+    access_key: $ANTHROPIC_API_KEY
+    provider_interface: claude
+    model: claude-3-7-sonnet-latest
+    usage: generating new code snippets, functions, or boilerplate based on user prompts or requirements

  - name: code_understanding
    provider_interface: openai
--- a/docs/source/conf.py
+++ b/docs/source/conf.py
@ -15,7 +15,7 @@ from sphinxawesome_theme.postprocess import Icons
 project = "Arch Docs"
 copyright = "2025, Katanemo Labs, Inc"
 author = "Katanemo Labs, Inc"
-release = " v0.3.1"
+release = " v0.3.2"

 # -- General configuration ---------------------------------------------------
 # https://www.sphinx-doc.org/en/master/usage/configuration.html#general-configuration
--- a/docs/source/get_started/quickstart.rst
+++ b/docs/source/get_started/quickstart.rst
@ -25,7 +25,7 @@ Arch's CLI allows you to manage and interact with the Arch gateway efficiently.

   $ python -m venv venv
   $ source venv/bin/activate   # On Windows, use: venv\Scripts\activate
-   $ pip install archgw==0.3.1
+   $ pip install archgw==0.3.2


 Build AI Agent with Arch Gateway
--- a/model_server/pyproject.toml
+++ b/model_server/pyproject.toml
@ -1,6 +1,6 @@
 [tool.poetry]
 name = "archgw_modelserver"
-version = "0.3.1"
+version = "0.3.2"
 description = "A model server for serving models"
 authors = ["Katanemo Labs, Inc <info@katanemo.com>"]
 license = "Apache 2.0"