fixing failing tests and updating rendered config file

This commit is contained in:
Salman Paracha 2025-09-18 09:51:27 -07:00
parent 79ff4bb164
commit a92e75c5ea
7 changed files with 24 additions and 37 deletions

View file

@ -626,32 +626,6 @@ static_resources:
tls_minimum_protocol_version: TLSv1_2 tls_minimum_protocol_version: TLSv1_2
tls_maximum_protocol_version: TLSv1_3 tls_maximum_protocol_version: TLSv1_3
- name: lambda_ai
connect_timeout: 0.5s
type: LOGICAL_DNS
dns_lookup_family: V4_ONLY
lb_policy: ROUND_ROBIN
load_assignment:
cluster_name: xai
endpoints:
- lb_endpoints:
- endpoint:
address:
socket_address:
address: api.lambda.ai
port_value: 443
hostname: "api.lambda.ai"
transport_socket:
name: envoy.transport_sockets.tls
typed_config:
"@type": type.googleapis.com/envoy.extensions.transport_sockets.tls.v3.UpstreamTlsContext
sni: api.lambda.ai
common_tls_context:
tls_params:
tls_minimum_protocol_version: TLSv1_2
tls_maximum_protocol_version: TLSv1_3
- name: gemini - name: gemini
connect_timeout: 0.5s connect_timeout: 0.5s
type: LOGICAL_DNS type: LOGICAL_DNS

View file

@ -15,7 +15,6 @@ SUPPORTED_PROVIDERS = [
"gemini", "gemini",
"anthropic", "anthropic",
"together_ai", "together_ai",
"lambda_ai",
"azure_openai", "azure_openai",
"xai", "xai",
] ]

View file

@ -171,8 +171,6 @@ pub enum LlmProviderType {
XAI, XAI,
#[serde(rename = "together_ai")] #[serde(rename = "together_ai")]
TogetherAI, TogetherAI,
#[serde(rename = "lambda_ai")]
LambdaAI,
#[serde(rename = "azure_openai")] #[serde(rename = "azure_openai")]
AzureOpenAI, AzureOpenAI,
} }
@ -189,7 +187,6 @@ impl Display for LlmProviderType {
LlmProviderType::OpenAI => write!(f, "openai"), LlmProviderType::OpenAI => write!(f, "openai"),
LlmProviderType::XAI => write!(f, "xai"), LlmProviderType::XAI => write!(f, "xai"),
LlmProviderType::TogetherAI => write!(f, "together_ai"), LlmProviderType::TogetherAI => write!(f, "together_ai"),
LlmProviderType::LambdaAI => write!(f, "lambda_ai"),
LlmProviderType::AzureOpenAI => write!(f, "azure_openai"), LlmProviderType::AzureOpenAI => write!(f, "azure_openai"),
} }
} }

View file

@ -16,7 +16,6 @@ pub enum ProviderId {
AzureOpenAI, AzureOpenAI,
XAI, XAI,
TogetherAI, TogetherAI,
LambdaAI,
} }
impl From<&str> for ProviderId { impl From<&str> for ProviderId {
@ -33,7 +32,6 @@ impl From<&str> for ProviderId {
"azure_openai" => ProviderId::AzureOpenAI, "azure_openai" => ProviderId::AzureOpenAI,
"xai" => ProviderId::XAI, "xai" => ProviderId::XAI,
"together_ai" => ProviderId::TogetherAI, "together_ai" => ProviderId::TogetherAI,
"lambda_ai" => ProviderId::LambdaAI,
_ => panic!("Unknown provider: {}", value), _ => panic!("Unknown provider: {}", value),
} }
} }
@ -57,8 +55,7 @@ impl ProviderId {
| ProviderId::GitHub | ProviderId::GitHub
| ProviderId::AzureOpenAI | ProviderId::AzureOpenAI
| ProviderId::XAI | ProviderId::XAI
| ProviderId::TogetherAI | ProviderId::TogetherAI,
| ProviderId::LambdaAI,
SupportedAPIs::AnthropicMessagesAPI(_)) => SupportedAPIs::OpenAIChatCompletions(OpenAIApi::ChatCompletions), SupportedAPIs::AnthropicMessagesAPI(_)) => SupportedAPIs::OpenAIChatCompletions(OpenAIApi::ChatCompletions),
(ProviderId::OpenAI (ProviderId::OpenAI
@ -70,8 +67,7 @@ impl ProviderId {
| ProviderId::GitHub | ProviderId::GitHub
| ProviderId::AzureOpenAI | ProviderId::AzureOpenAI
| ProviderId::XAI | ProviderId::XAI
| ProviderId::TogetherAI | ProviderId::TogetherAI,
| ProviderId::LambdaAI,
SupportedAPIs::OpenAIChatCompletions(_)) => SupportedAPIs::OpenAIChatCompletions(OpenAIApi::ChatCompletions), SupportedAPIs::OpenAIChatCompletions(_)) => SupportedAPIs::OpenAIChatCompletions(OpenAIApi::ChatCompletions),
} }
} }
@ -91,7 +87,6 @@ impl Display for ProviderId {
ProviderId::AzureOpenAI => write!(f, "azure_openai"), ProviderId::AzureOpenAI => write!(f, "azure_openai"),
ProviderId::XAI => write!(f, "xai"), ProviderId::XAI => write!(f, "xai"),
ProviderId::TogetherAI => write!(f, "together_ai"), ProviderId::TogetherAI => write!(f, "together_ai"),
ProviderId::LambdaAI => write!(f, "lambda_ai"),
} }
} }
} }

View file

@ -37,6 +37,12 @@ llm_providers:
- access_key: $GEMINI_API_KEY - access_key: $GEMINI_API_KEY
model: gemini/gemini-1.5-pro-latest model: gemini/gemini-1.5-pro-latest
- model: xai/grok-4-latest
access_key: $GROK_API_KEY
- model: together_ai/openai/gpt-oss-20b
access_key: $TOGETHER_API_KEY
- model: custom/test-model - model: custom/test-model
base_url: http://host.docker.internal:11223 base_url: http://host.docker.internal:11223
provider_interface: openai provider_interface: openai

View file

@ -41,6 +41,16 @@ llm_providers:
- model: mistral/mistral-7b-instruct - model: mistral/mistral-7b-instruct
base_url: http://mistral_local base_url: http://mistral_local
# Model aliases - friendly names that map to actual provider names
model_aliases:
# Alias for summarization tasks -> fast/cheap model
arch.summarize.v1:
target: gpt-4o
# Alias for general purpose tasks -> latest model
arch.v1:
target: mistral-8x7b
# provides a way to override default settings for the arch system # provides a way to override default settings for the arch system
overrides: overrides:
# By default Arch uses an NLI + embedding approach to match an incoming prompt to a prompt target. # By default Arch uses an NLI + embedding approach to match an incoming prompt to a prompt target.

View file

@ -31,12 +31,18 @@ llm_providers:
name: mistral/mistral-8x7b name: mistral/mistral-8x7b
provider_interface: mistral provider_interface: mistral
- base_url: http://mistral_local - base_url: http://mistral_local
cluster_name: mistral_mistral_local
endpoint: mistral_local endpoint: mistral_local
model: mistral-7b-instruct model: mistral-7b-instruct
name: mistral/mistral-7b-instruct name: mistral/mistral-7b-instruct
port: 80 port: 80
protocol: http protocol: http
provider_interface: mistral provider_interface: mistral
model_aliases:
arch.summarize.v1:
target: gpt-4o
arch.v1:
target: mistral-8x7b
overrides: overrides:
prompt_target_intent_matching_threshold: 0.6 prompt_target_intent_matching_threshold: 0.6
prompt_guards: prompt_guards: