fix fc integration (#110)

* fix fc integration

* fix integration

* remove file

* Update arch_fc.py
This commit is contained in:
Co Tran 2024-10-01 19:20:28 -07:00 committed by GitHub
parent f0fb4a48cd
commit ed50d29ccf
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
3 changed files with 4 additions and 5 deletions

View file

@@ -41,7 +41,7 @@ services:
<< : *common-vars
environment:
- OLLAMA_ENDPOINT=${OLLAMA_ENDPOINT:-host.docker.internal}
- FC_URL=${FC_URL:-empty}
- FC_URL=${FC_URL:-https://arch-fc-free-trial-4mzywewe.uc.gateway.dev/v1}
- OLLAMA_MODEL=Arch-Function-Calling-3B-Q4_K_M
- MODE=${MODE:-cloud}
# uncomment following line to use ollama endpoint that is hosted by docker

View file

@@ -19,7 +19,7 @@ fc_url = os.getenv("FC_URL", ollama_endpoint)
mode = os.getenv("MODE", "cloud")
if mode not in ["cloud", "local-gpu", "local-cpu"]:
raise ValueError(f"Invalid mode: {mode}")
arch_api_key = os.getenv("ARCH_API_KEY", "")
arch_api_key = os.getenv("ARCH_API_KEY", "vllm")
logger = logging.getLogger("uvicorn.error")
handler = None

View file

@@ -1,8 +1,7 @@
params:
temperature: 0.0001
temperature: 0.01
top_p : 0.5
repetition_penalty: 1.0
top_k: 50
max_tokens: 128
stop: ["<|im_start|>", "<|im_end|>"]
max_tokens: 512
stop_token_ids: [151645, 151643]