mirror of
https://github.com/katanemo/plano.git
synced 2026-06-17 15:25:17 +02:00
add comments for v1.1 archfc model endpoint
This commit is contained in:
parent
9b538ff074
commit
8b9f48ce9b
2 changed files with 8 additions and 0 deletions
|
|
@@ -30,5 +30,11 @@ llm_providers:
|
|||
model: deepseek-reasoner
|
||||
base_url: https://api.deepseek.com/
|
||||
|
||||
- name: groq
|
||||
access_key: $GROQ_API_KEY
|
||||
provider_interface: openai
|
||||
model: llama-3.1-8b-instant
|
||||
base_url: https://api.groq.com
|
||||
|
||||
tracing:
|
||||
random_sampling: 100
|
||||
|
|
|
|||
|
|
@@ -16,6 +16,8 @@ logger = get_model_server_logger()
|
|||
|
||||
# Define the client
|
||||
# ARCH_ENDPOINT = os.getenv("ARCH_ENDPOINT", "https://archfc.katanemo.dev/v1")
|
||||
# use temporary endpoint until we deprecate archfc-v1.0 from archfc.katanemo.dev
|
||||
# and officially release archfc-v1.1 on archfc.katanemo.dev
|
||||
ARCH_ENDPOINT = os.getenv("ARCH_ENDPOINT", "http://34.72.123.163:8000/v1")
|
||||
ARCH_API_KEY = "EMPTY"
|
||||
ARCH_CLIENT = OpenAI(base_url=ARCH_ENDPOINT, api_key=ARCH_API_KEY)
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue