Simplify the developer getting-started experience (#102)

* Fixed the build. We now have a bare-bones version of the docker-compose file with only two services, archgw and archgw-model-server. Tested using the CLI.

* some pre-commit fixes

* fixed cargo formatting issues

* fixed model server conflict changes

---------

Co-authored-by: Salman Paracha <salmanparacha@MacBook-Pro-261.local>
This commit is contained in:
Salman Paracha 2024-10-01 10:02:23 -07:00 committed by GitHub
parent 41cdef590a
commit 8654d3d5c5
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
20 changed files with 53 additions and 407 deletions

View file

@ -1,43 +1,28 @@
# Docker Compose service definitions, shown here as a rendered diff hunk.
# NOTE(review): indentation has been lost, and several keys appear twice in a
# row with different values (e.g. `context:`, `test:`, the service names). This
# looks like the old and new lines of the change interleaved without +/-
# markers. Confirm against the repository before treating any single line as
# the current configuration.
services:
# NOTE(review): two service names appear for this first entry (`envoy`, then
# `archgw`). Presumably the image-based `envoy` service was replaced by an
# `archgw` service built from arch/Dockerfile - verify.
envoy:
image: envoyproxy/envoy:v1.30-latest
hostname: envoy
archgw:
build:
context: ../
dockerfile: arch/Dockerfile
ports:
- "10000:10000"
# Two host ports (19901 and 18080) are mapped to container port 9901 below.
# NOTE(review): presumably one mapping is the old line and one the new - confirm.
- "19901:9901"
- "18080:9901"
volumes:
- ./envoy.yaml:/etc/envoy/envoy.yaml
- ./target/wasm32-wasi/release:/etc/envoy/proxy-wasm-plugins
# The host path comes from the ARCH_CONFIG_FILE environment variable.
- ${ARCH_CONFIG_FILE}:/config/arch_config.yaml
- /etc/ssl/cert.pem:/etc/ssl/cert.pem
- ./arch_log:/var/log/
# Startup ordering: each dependency is listed with a readiness condition.
depends_on:
qdrant:
condition: service_started
# NOTE(review): `embeddingserver` / `archgw_model_server` appear as a pair here
# and again at the service definition below - looks like a rename; confirm.
embeddingserver:
archgw_model_server:
condition: service_healthy
embeddingserver:
archgw_model_server:
build:
# Two build contexts are listed back to back (../embedding-server, ../model_server).
context: ../embedding-server
context: ../model_server
dockerfile: Dockerfile
ports:
# Container port 80 is published on host port 18080 in one line and 18081 in the other.
- "18080:80"
- "18081:80"
# Health probe that curls /healthz inside the container, with a 5s interval
# and 20 retries. The two `test:` lines differ only in the explicit `:80`.
# NOTE(review): without `-f`/`--fail`, curl reports success on HTTP error
# statuses, so this probe likely only checks that the port answers - confirm
# whether that is intended.
healthcheck:
test: ["CMD", "curl" ,"http://localhost:80/healthz"]
test: ["CMD", "curl" ,"http://localhost/healthz"]
interval: 5s
retries: 20
# NOTE(review): the `qdrant` and `chatbot-ui` entries below have no paired
# counterpart in this view, and the commit message above describes the compose
# file as having only two services. Presumably these are removed lines - verify.
qdrant:
image: qdrant/qdrant
hostname: vector-db
ports:
- 16333:6333
- 16334:6334
chatbot-ui:
build:
context: ../chatbot-ui
dockerfile: Dockerfile
ports:
- "18080:8080"
environment:
- CHAT_COMPLETION_ENDPOINT=http://envoy:10000/v1
# Mounts the host's Hugging Face cache directory at /root/.cache/huggingface.
# NOTE(review): with indentation lost, which service this `volumes:` entry
# belongs to cannot be determined from this view - confirm.
volumes:
- ~/.cache/huggingface:/root/.cache/huggingface