mirror of
https://github.com/katanemo/plano.git
synced 2026-04-25 00:36:34 +02:00
ArchFC endpoint integration (#94)
* integration * modify docker file * add params and fix python lint * fix empty context and tool calls * address comments * revert port * fix bug merge * fix environment * fix bug * fix compose * fix merge
This commit is contained in:
parent
1a7c1ad0a5
commit
17a643c410
9 changed files with 98 additions and 41 deletions
|
|
@ -1,3 +1,9 @@
|
|||
|
||||
x-variables: &common-vars
|
||||
environment:
|
||||
- MODE=${MODE:-cloud} # Set the default mode to 'cloud'; other values are local-gpu, local-cpu
|
||||
|
||||
|
||||
services:
|
||||
|
||||
arch:
|
||||
|
|
@ -11,7 +17,10 @@ services:
|
|||
- ./generated/envoy.yaml:/etc/envoy/envoy.yaml
|
||||
- /etc/ssl/cert.pem:/etc/ssl/cert.pem
|
||||
- ./arch_log:/var/log/
|
||||
- ./arch_config.yaml:/root/arch_config.yaml
|
||||
depends_on:
|
||||
# config_generator:
|
||||
# condition: service_completed_successfully
|
||||
model_server:
|
||||
condition: service_healthy
|
||||
environment:
|
||||
|
|
@ -30,14 +39,15 @@ services:
|
|||
volumes:
|
||||
- ~/.cache/huggingface:/root/.cache/huggingface
|
||||
- ./arch_config.yaml:/root/arch_config.yaml
|
||||
<< : *common-vars
|
||||
environment:
|
||||
- OLLAMA_ENDPOINT=${OLLAMA_ENDPOINT:-host.docker.internal}
|
||||
- FC_URL=${FC_URL:-empty}
|
||||
- OLLAMA_MODEL=Arch-Function-Calling-3B-Q4_K_M
|
||||
# use ollama endpoint that is hosted by host machine (no virtualization)
|
||||
- MODE=${MODE:-cloud}
|
||||
# uncomment following line to use ollama endpoint that is hosted by docker
|
||||
# - OLLAMA_ENDPOINT=ollama
|
||||
# - OLLAMA_MODEL=Arch-Function-Calling-1.5B:Q4_K_M
|
||||
|
||||
api_server:
|
||||
build:
|
||||
context: api_server
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue