better model names (#517)

This commit is contained in:
Adil Hafeez 2025-07-11 16:42:16 -07:00 committed by GitHub
parent 4e2355965b
commit a7fddf30f9
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
55 changed files with 979 additions and 483 deletions

View file

@ -30,21 +30,16 @@ endpoints:
# Central place to manage LLM providers: access keys, retry logic, failover and limits
llm_providers:
- name: OpenAI
provider_interface: openai
- name: openai/gpt-4o
access_key: $OPENAI_API_KEY
model: gpt-4o
model: openai/gpt-4o
default: true
- name: Mistral8x7b
provider_interface: openai
access_key: $MISTRAL_API_KEY
model: mistral-8x7b
- access_key: $MISTRAL_API_KEY
model: mistral/mistral-8x7b
- name: MistralLocal7b
provider_interface: openai
model: mistral-7b-instruct
endpoint: mistral_local
- model: mistral/mistral-7b-instruct
base_url: http://mistral_local
# provides a way to override default settings for the arch system
overrides:

View file

@ -0,0 +1,81 @@
# Named upstream endpoints. Other sections of this file refer to them by key
# (prompt_targets[].endpoint.name uses app_server; one llm_providers entry
# uses mistral_local).
endpoints:
  app_server:
    # NOTE(review): 0.005s reads as 5 milliseconds - confirm that such a short
    # connect timeout is intended.
    connect_timeout: 0.005s
    endpoint: 127.0.0.1
    port: 80
  error_target:
    endpoint: error_target_1
    port: 80
  mistral_local:
    endpoint: 127.0.0.1
    port: 8001
# Listener definitions, one mapping per traffic direction. Both bind to
# 0.0.0.0, use the openai message format and a 5s timeout; only the port
# differs.
listeners:
  egress_traffic:
    address: 0.0.0.0
    message_format: openai
    port: 12000
    timeout: 5s
  ingress_traffic:
    address: 0.0.0.0
    message_format: openai
    port: 10000
    timeout: 5s
# LLM providers, one list item per model. In every entry below, `name` has the
# form <provider_interface>/<model>.
llm_providers:
  # Access keys are written as $VARIABLE placeholders - presumably substituted
  # from the environment; confirm against the loader.
  - access_key: $OPENAI_API_KEY
    default: true
    model: gpt-4o
    name: openai/gpt-4o
    provider_interface: openai
  - access_key: $MISTRAL_API_KEY
    model: mistral-8x7b
    name: mistral/mistral-8x7b
    provider_interface: mistral
  # Provider with no access key; it carries a base_url plus endpoint, port and
  # protocol fields. The endpoint value matches the mistral_local key under
  # `endpoints`.
  - base_url: http://mistral_local
    endpoint: mistral_local
    model: mistral-7b-instruct
    name: mistral/mistral-7b-instruct
    port: 80
    protocol: http
    provider_interface: mistral
# Overrides for system defaults.
overrides:
  # Threshold used when matching a prompt to a prompt target.
  # NOTE(review): the default this replaces is not visible here - confirm.
  prompt_target_intent_matching_threshold: 0.6
# Input guards. The only guard configured is `jailbreak`, whose on_exception
# handler supplies a fixed message.
prompt_guards:
  input_guards:
    jailbreak:
      on_exception:
        # Folded scalar (>-): the two lines join with a single space and no
        # trailing newline, so the value is one sentence.
        message: >-
          Looks like you're curious about my abilities, but I can only provide
          assistance within my programmed parameters.
# Prompt targets: each item names a target, describes when it applies and
# points at a path on one of the entries under `endpoints`.
prompt_targets:
  # Default target (default: true), sent with POST to /agent/summary on
  # app_server.
  - auto_llm_dispatch_on_response: true
    default: true
    # NOTE(review): "handel" looks like a typo for "handle". It is left
    # unchanged because this text is read at runtime - fix it at the source.
    description: >-
      handel all scenarios that are question and answer in nature. Like
      summarization, information extraction, etc.
    endpoint:
      http_method: POST
      name: app_server
      path: /agent/summary
    name: information_extraction
    system_prompt: >-
      You are a helpful information extraction assistant. Use the information
      that is provided to you.
  # Target with two declared parameters; no http_method is set for it.
  - description: Reboot a specific network device
    endpoint:
      name: app_server
      path: /agent/action
    name: reboot_network_device
    parameters:
      - description: Identifier of the network device to reboot.
        name: device_id
        required: true
        type: str
      # Boolean flag that defaults to false; the enum lists both allowed
      # values.
      - default: false
        description: Confirmation flag to proceed with reboot.
        enum:
          - true
          - false
        name: confirmation
        type: bool
# NOTE(review): kept as a top-level key. The top-level keys in this file appear
# in alphabetical order and this one falls between prompt_targets and tracing.
# Confirm it is the file-wide system prompt rather than a field of the last
# prompt target.
system_prompt: >-
  You are a network assistant that just offers facts; not advice on
  manufacturers or purchasing decisions.
# Tracing settings.
tracing:
  # NOTE(review): presumably the fraction of requests traced (0.1 = 10%) -
  # confirm.
  sampling_rate: 0.1

# Configuration schema version.
version: v0.1