mirror of
https://github.com/katanemo/plano.git
synced 2026-05-27 14:17:15 +02:00
fix fc integration (#110)
* fix fc integration * fix integration * remove file * Update arch_fc.py
This commit is contained in:
parent
f0fb4a48cd
commit
ed50d29ccf
3 changed files with 4 additions and 5 deletions
|
|
@@ -41,7 +41,7 @@ services:
|
|||
<< : *common-vars
|
||||
environment:
|
||||
- OLLAMA_ENDPOINT=${OLLAMA_ENDPOINT:-host.docker.internal}
|
||||
- FC_URL=${FC_URL:-empty}
|
||||
- FC_URL=${FC_URL:-https://arch-fc-free-trial-4mzywewe.uc.gateway.dev/v1}
|
||||
- OLLAMA_MODEL=Arch-Function-Calling-3B-Q4_K_M
|
||||
- MODE=${MODE:-cloud}
|
||||
# uncomment following line to use ollama endpoint that is hosted by docker
|
||||
|
|
|
|||
|
|
@@ -19,7 +19,7 @@ fc_url = os.getenv("FC_URL", ollama_endpoint)
|
|||
mode = os.getenv("MODE", "cloud")
|
||||
if mode not in ["cloud", "local-gpu", "local-cpu"]:
|
||||
raise ValueError(f"Invalid mode: {mode}")
|
||||
arch_api_key = os.getenv("ARCH_API_KEY", "")
|
||||
arch_api_key = os.getenv("ARCH_API_KEY", "vllm")
|
||||
logger = logging.getLogger("uvicorn.error")
|
||||
|
||||
handler = None
|
||||
|
|
|
|||
|
|
@@ -1,8 +1,7 @@
|
|||
params:
|
||||
temperature: 0.0001
|
||||
temperature: 0.01
|
||||
top_p : 0.5
|
||||
repetition_penalty: 1.0
|
||||
top_k: 50
|
||||
max_tokens: 128
|
||||
stop: ["<|im_start|>", "<|im_end|>"]
|
||||
max_tokens: 512
|
||||
stop_token_ids: [151645, 151643]
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue