2024-10-08 13:18:34 -07:00
|
|
|
version: v0.1
|
2024-09-24 13:54:17 -07:00
|
|
|
|
2024-10-08 13:18:34 -07:00
|
|
|
listen:
|
|
|
|
|
address: 0.0.0.0 # or 127.0.0.1
|
|
|
|
|
port: 10000
|
|
|
|
|
# Defines how Arch should parse the content of an HTTP request whose Content-Type is application/json or text/plain
|
|
|
|
|
message_format: huggingface
|
2024-09-30 14:54:01 -07:00
|
|
|
|
2024-10-08 13:18:34 -07:00
|
|
|
# Centralized way to manage LLMs: access keys, retry logic, failover, and limits
|
2024-09-30 14:54:01 -07:00
|
|
|
llm_providers:
|
2024-10-08 13:18:34 -07:00
|
|
|
- name: OpenAI
|
|
|
|
|
provider: openai
|
2024-10-06 16:54:34 -07:00
|
|
|
access_key: OPENAI_API_KEY
|
|
|
|
|
model: gpt-4o
|
2024-10-08 13:18:34 -07:00
|
|
|
default: true
|
2024-10-06 16:54:34 -07:00
|
|
|
stream: true
|
2024-09-24 13:54:17 -07:00
|
|
|
|
2024-10-08 13:18:34 -07:00
|
|
|
# default system prompt used by all prompt targets
|
|
|
|
|
system_prompt: You are a network assistant that just offers facts; not advice on manufacturers or purchasing decisions.
|
|
|
|
|
|
2024-09-24 13:54:17 -07:00
|
|
|
prompt_targets:
|
|
|
|
|
- name: reboot_devices
|
2024-10-08 13:18:34 -07:00
|
|
|
description: Reboot specific devices or device groups
|
2024-09-24 13:54:17 -07:00
|
|
|
|
|
|
|
|
path: /agent/device_reboot
|
|
|
|
|
parameters:
|
2024-10-08 13:18:34 -07:00
|
|
|
- name: device_ids
|
|
|
|
|
type: list
|
|
|
|
|
description: A list of device identifiers (IDs) to reboot.
|
2024-09-24 13:54:17 -07:00
|
|
|
required: false
|
2024-10-08 13:18:34 -07:00
|
|
|
- name: device_group
|
|
|
|
|
type: str
|
|
|
|
|
description: The name of the device group to reboot
|
2024-09-24 13:54:17 -07:00
|
|
|
required: false
|
|
|
|
|
|
2024-10-06 16:54:34 -07:00
|
|
|
# Arch performs round-robin load balancing between different endpoints, managed via the cluster subsystem.
|
|
|
|
|
endpoints:
|
|
|
|
|
app_server:
|
|
|
|
|
# value can be an IP address or a hostname, with port
|
|
|
|
|
# this could also be a list of endpoints for load balancing
|
|
|
|
|
# for example endpoint: [ ip1:port, ip2:port ]
|
2024-10-08 13:18:34 -07:00
|
|
|
endpoint: 127.0.0.1:80
|
2024-10-06 16:54:34 -07:00
|
|
|
# max time to wait for a connection to be established
|
|
|
|
|
connect_timeout: 0.005s
|