mirror of
https://github.com/katanemo/plano.git
synced 2026-06-20 15:28:07 +02:00
fixing failing tests and updating rendered config file
This commit is contained in:
parent
79ff4bb164
commit
a92e75c5ea
7 changed files with 24 additions and 37 deletions
|
|
@ -626,32 +626,6 @@ static_resources:
|
||||||
tls_minimum_protocol_version: TLSv1_2
|
tls_minimum_protocol_version: TLSv1_2
|
||||||
tls_maximum_protocol_version: TLSv1_3
|
tls_maximum_protocol_version: TLSv1_3
|
||||||
|
|
||||||
- name: lambda_ai
|
|
||||||
connect_timeout: 0.5s
|
|
||||||
type: LOGICAL_DNS
|
|
||||||
dns_lookup_family: V4_ONLY
|
|
||||||
lb_policy: ROUND_ROBIN
|
|
||||||
load_assignment:
|
|
||||||
cluster_name: xai
|
|
||||||
endpoints:
|
|
||||||
- lb_endpoints:
|
|
||||||
- endpoint:
|
|
||||||
address:
|
|
||||||
socket_address:
|
|
||||||
address: api.lambda.ai
|
|
||||||
port_value: 443
|
|
||||||
hostname: "api.lambda.ai"
|
|
||||||
transport_socket:
|
|
||||||
name: envoy.transport_sockets.tls
|
|
||||||
typed_config:
|
|
||||||
"@type": type.googleapis.com/envoy.extensions.transport_sockets.tls.v3.UpstreamTlsContext
|
|
||||||
sni: api.lambda.ai
|
|
||||||
common_tls_context:
|
|
||||||
tls_params:
|
|
||||||
tls_minimum_protocol_version: TLSv1_2
|
|
||||||
tls_maximum_protocol_version: TLSv1_3
|
|
||||||
|
|
||||||
|
|
||||||
- name: gemini
|
- name: gemini
|
||||||
connect_timeout: 0.5s
|
connect_timeout: 0.5s
|
||||||
type: LOGICAL_DNS
|
type: LOGICAL_DNS
|
||||||
|
|
|
||||||
|
|
@ -15,7 +15,6 @@ SUPPORTED_PROVIDERS = [
|
||||||
"gemini",
|
"gemini",
|
||||||
"anthropic",
|
"anthropic",
|
||||||
"together_ai",
|
"together_ai",
|
||||||
"lambda_ai",
|
|
||||||
"azure_openai",
|
"azure_openai",
|
||||||
"xai",
|
"xai",
|
||||||
]
|
]
|
||||||
|
|
|
||||||
|
|
@ -171,8 +171,6 @@ pub enum LlmProviderType {
|
||||||
XAI,
|
XAI,
|
||||||
#[serde(rename = "together_ai")]
|
#[serde(rename = "together_ai")]
|
||||||
TogetherAI,
|
TogetherAI,
|
||||||
#[serde(rename = "lambda_ai")]
|
|
||||||
LambdaAI,
|
|
||||||
#[serde(rename = "azure_openai")]
|
#[serde(rename = "azure_openai")]
|
||||||
AzureOpenAI,
|
AzureOpenAI,
|
||||||
}
|
}
|
||||||
|
|
@ -189,7 +187,6 @@ impl Display for LlmProviderType {
|
||||||
LlmProviderType::OpenAI => write!(f, "openai"),
|
LlmProviderType::OpenAI => write!(f, "openai"),
|
||||||
LlmProviderType::XAI => write!(f, "xai"),
|
LlmProviderType::XAI => write!(f, "xai"),
|
||||||
LlmProviderType::TogetherAI => write!(f, "together_ai"),
|
LlmProviderType::TogetherAI => write!(f, "together_ai"),
|
||||||
LlmProviderType::LambdaAI => write!(f, "lambda_ai"),
|
|
||||||
LlmProviderType::AzureOpenAI => write!(f, "azure_openai"),
|
LlmProviderType::AzureOpenAI => write!(f, "azure_openai"),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
||||||
|
|
@ -16,7 +16,6 @@ pub enum ProviderId {
|
||||||
AzureOpenAI,
|
AzureOpenAI,
|
||||||
XAI,
|
XAI,
|
||||||
TogetherAI,
|
TogetherAI,
|
||||||
LambdaAI,
|
|
||||||
}
|
}
|
||||||
|
|
||||||
impl From<&str> for ProviderId {
|
impl From<&str> for ProviderId {
|
||||||
|
|
@ -33,7 +32,6 @@ impl From<&str> for ProviderId {
|
||||||
"azure_openai" => ProviderId::AzureOpenAI,
|
"azure_openai" => ProviderId::AzureOpenAI,
|
||||||
"xai" => ProviderId::XAI,
|
"xai" => ProviderId::XAI,
|
||||||
"together_ai" => ProviderId::TogetherAI,
|
"together_ai" => ProviderId::TogetherAI,
|
||||||
"lambda_ai" => ProviderId::LambdaAI,
|
|
||||||
_ => panic!("Unknown provider: {}", value),
|
_ => panic!("Unknown provider: {}", value),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
@ -57,8 +55,7 @@ impl ProviderId {
|
||||||
| ProviderId::GitHub
|
| ProviderId::GitHub
|
||||||
| ProviderId::AzureOpenAI
|
| ProviderId::AzureOpenAI
|
||||||
| ProviderId::XAI
|
| ProviderId::XAI
|
||||||
| ProviderId::TogetherAI
|
| ProviderId::TogetherAI,
|
||||||
| ProviderId::LambdaAI,
|
|
||||||
SupportedAPIs::AnthropicMessagesAPI(_)) => SupportedAPIs::OpenAIChatCompletions(OpenAIApi::ChatCompletions),
|
SupportedAPIs::AnthropicMessagesAPI(_)) => SupportedAPIs::OpenAIChatCompletions(OpenAIApi::ChatCompletions),
|
||||||
|
|
||||||
(ProviderId::OpenAI
|
(ProviderId::OpenAI
|
||||||
|
|
@ -70,8 +67,7 @@ impl ProviderId {
|
||||||
| ProviderId::GitHub
|
| ProviderId::GitHub
|
||||||
| ProviderId::AzureOpenAI
|
| ProviderId::AzureOpenAI
|
||||||
| ProviderId::XAI
|
| ProviderId::XAI
|
||||||
| ProviderId::TogetherAI
|
| ProviderId::TogetherAI,
|
||||||
| ProviderId::LambdaAI,
|
|
||||||
SupportedAPIs::OpenAIChatCompletions(_)) => SupportedAPIs::OpenAIChatCompletions(OpenAIApi::ChatCompletions),
|
SupportedAPIs::OpenAIChatCompletions(_)) => SupportedAPIs::OpenAIChatCompletions(OpenAIApi::ChatCompletions),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
@ -91,7 +87,6 @@ impl Display for ProviderId {
|
||||||
ProviderId::AzureOpenAI => write!(f, "azure_openai"),
|
ProviderId::AzureOpenAI => write!(f, "azure_openai"),
|
||||||
ProviderId::XAI => write!(f, "xai"),
|
ProviderId::XAI => write!(f, "xai"),
|
||||||
ProviderId::TogetherAI => write!(f, "together_ai"),
|
ProviderId::TogetherAI => write!(f, "together_ai"),
|
||||||
ProviderId::LambdaAI => write!(f, "lambda_ai"),
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
||||||
|
|
@ -37,6 +37,12 @@ llm_providers:
|
||||||
- access_key: $GEMINI_API_KEY
|
- access_key: $GEMINI_API_KEY
|
||||||
model: gemini/gemini-1.5-pro-latest
|
model: gemini/gemini-1.5-pro-latest
|
||||||
|
|
||||||
|
- model: xai/grok-4-latest
|
||||||
|
access_key: $GROK_API_KEY
|
||||||
|
|
||||||
|
- model: together_ai/openai/gpt-oss-20b
|
||||||
|
access_key: $TOGETHER_API_KEY
|
||||||
|
|
||||||
- model: custom/test-model
|
- model: custom/test-model
|
||||||
base_url: http://host.docker.internal:11223
|
base_url: http://host.docker.internal:11223
|
||||||
provider_interface: openai
|
provider_interface: openai
|
||||||
|
|
|
||||||
|
|
@ -41,6 +41,16 @@ llm_providers:
|
||||||
- model: mistral/mistral-7b-instruct
|
- model: mistral/mistral-7b-instruct
|
||||||
base_url: http://mistral_local
|
base_url: http://mistral_local
|
||||||
|
|
||||||
|
# Model aliases - friendly names that map to actual provider names
|
||||||
|
model_aliases:
|
||||||
|
# Alias for summarization tasks -> fast/cheap model
|
||||||
|
arch.summarize.v1:
|
||||||
|
target: gpt-4o
|
||||||
|
|
||||||
|
# Alias for general purpose tasks -> latest model
|
||||||
|
arch.v1:
|
||||||
|
target: mistral-8x7b
|
||||||
|
|
||||||
# provides a way to override default settings for the arch system
|
# provides a way to override default settings for the arch system
|
||||||
overrides:
|
overrides:
|
||||||
# By default Arch uses an NLI + embedding approach to match an incoming prompt to a prompt target.
|
# By default Arch uses an NLI + embedding approach to match an incoming prompt to a prompt target.
|
||||||
|
|
|
||||||
|
|
@ -31,12 +31,18 @@ llm_providers:
|
||||||
name: mistral/mistral-8x7b
|
name: mistral/mistral-8x7b
|
||||||
provider_interface: mistral
|
provider_interface: mistral
|
||||||
- base_url: http://mistral_local
|
- base_url: http://mistral_local
|
||||||
|
cluster_name: mistral_mistral_local
|
||||||
endpoint: mistral_local
|
endpoint: mistral_local
|
||||||
model: mistral-7b-instruct
|
model: mistral-7b-instruct
|
||||||
name: mistral/mistral-7b-instruct
|
name: mistral/mistral-7b-instruct
|
||||||
port: 80
|
port: 80
|
||||||
protocol: http
|
protocol: http
|
||||||
provider_interface: mistral
|
provider_interface: mistral
|
||||||
|
model_aliases:
|
||||||
|
arch.summarize.v1:
|
||||||
|
target: gpt-4o
|
||||||
|
arch.v1:
|
||||||
|
target: mistral-8x7b
|
||||||
overrides:
|
overrides:
|
||||||
prompt_target_intent_matching_threshold: 0.6
|
prompt_target_intent_matching_threshold: 0.6
|
||||||
prompt_guards:
|
prompt_guards:
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue