adding support for claude code routing (#575)

* fixes for Claude Code routing (first commit)

* removing redundant enum tags for cache_control

* making sure that Claude Code can run via the archgw CLI

* fixing broken config

* added a README.md and updated the CLI to use more of our defined patterns for params

* fixed config.yaml

* minor fixes to make sure PR is clean. Ready to ship

* adding claude-sonnet-4-5 to the config

* fixes based on PR

* fixed alias for README

* fixed 400 error-handling tests, now that we set temperature to 1.0 for GPT-5

---------

Co-authored-by: Salman Paracha <salmanparacha@MacBook-Pro-257.local>
Co-authored-by: Salman Paracha <salmanparacha@MacBook-Pro-288.local>
This commit is contained in:
Salman Paracha 2025-09-29 19:23:08 -07:00 committed by GitHub
parent 03c2cf6f0d
commit f00870dccb
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
16 changed files with 903 additions and 106 deletions

View file

@ -140,7 +140,7 @@ static_resources:
route:
auto_host_rewrite: true
cluster: {{ llm_cluster_name }}
timeout: 60s
timeout: 300s
{% endfor %}
{% if agent_orchestrator %}
@ -153,7 +153,7 @@ static_resources:
route:
auto_host_rewrite: true
cluster: {{ agent_orchestrator }}
timeout: 60s
timeout: 300s
{% endif %}
http_filters:
- name: envoy.filters.http.compressor
@ -266,7 +266,7 @@ static_resources:
route:
auto_host_rewrite: true
cluster: {{ internal_cluster }}
timeout: 60s
timeout: 300s
{% endfor %}
{% for cluster_name, cluster in arch_clusters.items() %}
@ -279,7 +279,7 @@ static_resources:
route:
auto_host_rewrite: true
cluster: {{ cluster_name }}
timeout: 60s
timeout: 300s
{% endfor %}
http_filters:
- name: envoy.filters.http.router
@ -434,7 +434,7 @@ static_resources:
route:
auto_host_rewrite: true
cluster: {{ llm_cluster_name }}
timeout: 60s
timeout: 300s
{% endfor %}
- match:
prefix: "/"