mirror of
https://github.com/katanemo/plano.git
synced 2026-06-17 15:25:17 +02:00
fixing failing tests and updating rendered config file
This commit is contained in:
parent
79ff4bb164
commit
a92e75c5ea
7 changed files with 24 additions and 37 deletions
|
|
@ -626,32 +626,6 @@ static_resources:
|
|||
tls_minimum_protocol_version: TLSv1_2
|
||||
tls_maximum_protocol_version: TLSv1_3
|
||||
|
||||
- name: lambda_ai
|
||||
connect_timeout: 0.5s
|
||||
type: LOGICAL_DNS
|
||||
dns_lookup_family: V4_ONLY
|
||||
lb_policy: ROUND_ROBIN
|
||||
load_assignment:
|
||||
cluster_name: xai
|
||||
endpoints:
|
||||
- lb_endpoints:
|
||||
- endpoint:
|
||||
address:
|
||||
socket_address:
|
||||
address: api.lambda.ai
|
||||
port_value: 443
|
||||
hostname: "api.lambda.ai"
|
||||
transport_socket:
|
||||
name: envoy.transport_sockets.tls
|
||||
typed_config:
|
||||
"@type": type.googleapis.com/envoy.extensions.transport_sockets.tls.v3.UpstreamTlsContext
|
||||
sni: api.lambda.ai
|
||||
common_tls_context:
|
||||
tls_params:
|
||||
tls_minimum_protocol_version: TLSv1_2
|
||||
tls_maximum_protocol_version: TLSv1_3
|
||||
|
||||
|
||||
- name: gemini
|
||||
connect_timeout: 0.5s
|
||||
type: LOGICAL_DNS
|
||||
|
|
|
|||
|
|
@ -15,7 +15,6 @@ SUPPORTED_PROVIDERS = [
|
|||
"gemini",
|
||||
"anthropic",
|
||||
"together_ai",
|
||||
"lambda_ai",
|
||||
"azure_openai",
|
||||
"xai",
|
||||
]
|
||||
|
|
|
|||
|
|
@ -171,8 +171,6 @@ pub enum LlmProviderType {
|
|||
XAI,
|
||||
#[serde(rename = "together_ai")]
|
||||
TogetherAI,
|
||||
#[serde(rename = "lambda_ai")]
|
||||
LambdaAI,
|
||||
#[serde(rename = "azure_openai")]
|
||||
AzureOpenAI,
|
||||
}
|
||||
|
|
@ -189,7 +187,6 @@ impl Display for LlmProviderType {
|
|||
LlmProviderType::OpenAI => write!(f, "openai"),
|
||||
LlmProviderType::XAI => write!(f, "xai"),
|
||||
LlmProviderType::TogetherAI => write!(f, "together_ai"),
|
||||
LlmProviderType::LambdaAI => write!(f, "lambda_ai"),
|
||||
LlmProviderType::AzureOpenAI => write!(f, "azure_openai"),
|
||||
}
|
||||
}
|
||||
|
|
|
|||
|
|
@ -16,7 +16,6 @@ pub enum ProviderId {
|
|||
AzureOpenAI,
|
||||
XAI,
|
||||
TogetherAI,
|
||||
LambdaAI,
|
||||
}
|
||||
|
||||
impl From<&str> for ProviderId {
|
||||
|
|
@ -33,7 +32,6 @@ impl From<&str> for ProviderId {
|
|||
"azure_openai" => ProviderId::AzureOpenAI,
|
||||
"xai" => ProviderId::XAI,
|
||||
"together_ai" => ProviderId::TogetherAI,
|
||||
"lambda_ai" => ProviderId::LambdaAI,
|
||||
_ => panic!("Unknown provider: {}", value),
|
||||
}
|
||||
}
|
||||
|
|
@ -57,8 +55,7 @@ impl ProviderId {
|
|||
| ProviderId::GitHub
|
||||
| ProviderId::AzureOpenAI
|
||||
| ProviderId::XAI
|
||||
| ProviderId::TogetherAI
|
||||
| ProviderId::LambdaAI,
|
||||
| ProviderId::TogetherAI,
|
||||
SupportedAPIs::AnthropicMessagesAPI(_)) => SupportedAPIs::OpenAIChatCompletions(OpenAIApi::ChatCompletions),
|
||||
|
||||
(ProviderId::OpenAI
|
||||
|
|
@ -70,8 +67,7 @@ impl ProviderId {
|
|||
| ProviderId::GitHub
|
||||
| ProviderId::AzureOpenAI
|
||||
| ProviderId::XAI
|
||||
| ProviderId::TogetherAI
|
||||
| ProviderId::LambdaAI,
|
||||
| ProviderId::TogetherAI,
|
||||
SupportedAPIs::OpenAIChatCompletions(_)) => SupportedAPIs::OpenAIChatCompletions(OpenAIApi::ChatCompletions),
|
||||
}
|
||||
}
|
||||
|
|
@ -91,7 +87,6 @@ impl Display for ProviderId {
|
|||
ProviderId::AzureOpenAI => write!(f, "azure_openai"),
|
||||
ProviderId::XAI => write!(f, "xai"),
|
||||
ProviderId::TogetherAI => write!(f, "together_ai"),
|
||||
ProviderId::LambdaAI => write!(f, "lambda_ai"),
|
||||
}
|
||||
}
|
||||
}
|
||||
|
|
|
|||
|
|
@ -37,6 +37,12 @@ llm_providers:
|
|||
- access_key: $GEMINI_API_KEY
|
||||
model: gemini/gemini-1.5-pro-latest
|
||||
|
||||
- model: xai/grok-4-latest
|
||||
access_key: $GROK_API_KEY
|
||||
|
||||
- model: together_ai/openai/gpt-oss-20b
|
||||
access_key: $TOGETHER_API_KEY
|
||||
|
||||
- model: custom/test-model
|
||||
base_url: http://host.docker.internal:11223
|
||||
provider_interface: openai
|
||||
|
|
|
|||
|
|
@ -41,6 +41,16 @@ llm_providers:
|
|||
- model: mistral/mistral-7b-instruct
|
||||
base_url: http://mistral_local
|
||||
|
||||
# Model aliases - friendly names that map to actual provider names
|
||||
model_aliases:
|
||||
# Alias for summarization tasks -> fast/cheap model
|
||||
arch.summarize.v1:
|
||||
target: gpt-4o
|
||||
|
||||
# Alias for general purpose tasks -> latest model
|
||||
arch.v1:
|
||||
target: mistral-8x7b
|
||||
|
||||
# provides a way to override default settings for the arch system
|
||||
overrides:
|
||||
# By default Arch uses an NLI + embedding approach to match an incoming prompt to a prompt target.
|
||||
|
|
|
|||
|
|
@ -31,12 +31,18 @@ llm_providers:
|
|||
name: mistral/mistral-8x7b
|
||||
provider_interface: mistral
|
||||
- base_url: http://mistral_local
|
||||
cluster_name: mistral_mistral_local
|
||||
endpoint: mistral_local
|
||||
model: mistral-7b-instruct
|
||||
name: mistral/mistral-7b-instruct
|
||||
port: 80
|
||||
protocol: http
|
||||
provider_interface: mistral
|
||||
model_aliases:
|
||||
arch.summarize.v1:
|
||||
target: gpt-4o
|
||||
arch.v1:
|
||||
target: mistral-8x7b
|
||||
overrides:
|
||||
prompt_target_intent_matching_threshold: 0.6
|
||||
prompt_guards:
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue