fixing failing tests and updating rendered config file

This commit is contained in:
Salman Paracha 2025-09-18 09:51:27 -07:00
parent 79ff4bb164
commit a92e75c5ea
7 changed files with 24 additions and 37 deletions

View file

@ -626,32 +626,6 @@ static_resources:
tls_minimum_protocol_version: TLSv1_2
tls_maximum_protocol_version: TLSv1_3
- name: lambda_ai
connect_timeout: 0.5s
type: LOGICAL_DNS
dns_lookup_family: V4_ONLY
lb_policy: ROUND_ROBIN
load_assignment:
cluster_name: xai
endpoints:
- lb_endpoints:
- endpoint:
address:
socket_address:
address: api.lambda.ai
port_value: 443
hostname: "api.lambda.ai"
transport_socket:
name: envoy.transport_sockets.tls
typed_config:
"@type": type.googleapis.com/envoy.extensions.transport_sockets.tls.v3.UpstreamTlsContext
sni: api.lambda.ai
common_tls_context:
tls_params:
tls_minimum_protocol_version: TLSv1_2
tls_maximum_protocol_version: TLSv1_3
- name: gemini
connect_timeout: 0.5s
type: LOGICAL_DNS

View file

@ -15,7 +15,6 @@ SUPPORTED_PROVIDERS = [
"gemini",
"anthropic",
"together_ai",
"lambda_ai",
"azure_openai",
"xai",
]

View file

@ -171,8 +171,6 @@ pub enum LlmProviderType {
XAI,
#[serde(rename = "together_ai")]
TogetherAI,
#[serde(rename = "lambda_ai")]
LambdaAI,
#[serde(rename = "azure_openai")]
AzureOpenAI,
}
@ -189,7 +187,6 @@ impl Display for LlmProviderType {
LlmProviderType::OpenAI => write!(f, "openai"),
LlmProviderType::XAI => write!(f, "xai"),
LlmProviderType::TogetherAI => write!(f, "together_ai"),
LlmProviderType::LambdaAI => write!(f, "lambda_ai"),
LlmProviderType::AzureOpenAI => write!(f, "azure_openai"),
}
}

View file

@ -16,7 +16,6 @@ pub enum ProviderId {
AzureOpenAI,
XAI,
TogetherAI,
LambdaAI,
}
impl From<&str> for ProviderId {
@ -33,7 +32,6 @@ impl From<&str> for ProviderId {
"azure_openai" => ProviderId::AzureOpenAI,
"xai" => ProviderId::XAI,
"together_ai" => ProviderId::TogetherAI,
"lambda_ai" => ProviderId::LambdaAI,
_ => panic!("Unknown provider: {}", value),
}
}
@ -57,8 +55,7 @@ impl ProviderId {
| ProviderId::GitHub
| ProviderId::AzureOpenAI
| ProviderId::XAI
| ProviderId::TogetherAI
| ProviderId::LambdaAI,
| ProviderId::TogetherAI,
SupportedAPIs::AnthropicMessagesAPI(_)) => SupportedAPIs::OpenAIChatCompletions(OpenAIApi::ChatCompletions),
(ProviderId::OpenAI
@ -70,8 +67,7 @@ impl ProviderId {
| ProviderId::GitHub
| ProviderId::AzureOpenAI
| ProviderId::XAI
| ProviderId::TogetherAI
| ProviderId::LambdaAI,
| ProviderId::TogetherAI,
SupportedAPIs::OpenAIChatCompletions(_)) => SupportedAPIs::OpenAIChatCompletions(OpenAIApi::ChatCompletions),
}
}
@ -91,7 +87,6 @@ impl Display for ProviderId {
ProviderId::AzureOpenAI => write!(f, "azure_openai"),
ProviderId::XAI => write!(f, "xai"),
ProviderId::TogetherAI => write!(f, "together_ai"),
ProviderId::LambdaAI => write!(f, "lambda_ai"),
}
}
}

View file

@ -37,6 +37,12 @@ llm_providers:
- access_key: $GEMINI_API_KEY
model: gemini/gemini-1.5-pro-latest
- model: xai/grok-4-latest
access_key: $GROK_API_KEY
- model: together_ai/openai/gpt-oss-20b
access_key: $TOGETHER_API_KEY
- model: custom/test-model
base_url: http://host.docker.internal:11223
provider_interface: openai

View file

@ -41,6 +41,16 @@ llm_providers:
- model: mistral/mistral-7b-instruct
base_url: http://mistral_local
# Model aliases - friendly names that map to actual model names
model_aliases:
# Alias for summarization tasks -> fast/cheap model
arch.summarize.v1:
target: gpt-4o
# Alias for general purpose tasks -> latest model
arch.v1:
target: mistral-8x7b
# provides a way to override default settings for the arch system
overrides:
# By default Arch uses an NLI + embedding approach to match an incoming prompt to a prompt target.

View file

@ -31,12 +31,18 @@ llm_providers:
name: mistral/mistral-8x7b
provider_interface: mistral
- base_url: http://mistral_local
cluster_name: mistral_mistral_local
endpoint: mistral_local
model: mistral-7b-instruct
name: mistral/mistral-7b-instruct
port: 80
protocol: http
provider_interface: mistral
model_aliases:
arch.summarize.v1:
target: gpt-4o
arch.v1:
target: mistral-8x7b
overrides:
prompt_target_intent_matching_threshold: 0.6
prompt_guards: