Add docker-compose configuration for inference services
This commit is contained in:
342
open-assistant/docker-compose.yml
Normal file
342
open-assistant/docker-compose.yml
Normal file
@@ -0,0 +1,342 @@
|
||||
version: "3.8"
|
||||
|
||||
services:
|
||||
# Use `docker compose --profile backend-dev up --build --attach-dependencies` to start a database and work and the backend.
|
||||
|
||||
# Use `docker compose --profile frontend-dev up --build --attach-dependencies` to start the services needed to work on the frontend. If you want to also run the inference, add a second `--profile inference` argument.
|
||||
|
||||
# If you update the containers used by the inference profile, please update inference/README.md. Thank you
|
||||
|
||||
# The profile ci is used by CI automations. (i.e E2E testing)
|
||||
|
||||
# This DB is for the FastAPI Backend.
|
||||
db:
|
||||
platform: "${DB_PLATFORM:-}"
|
||||
image: ghcr.io/laion-ai/open-assistant/oasst-postgres
|
||||
pull_policy: always
|
||||
restart: always
|
||||
profiles: ["frontend-dev", "backend-dev", "ci", "inference-dev"]
|
||||
ports:
|
||||
- 5432:5432
|
||||
environment:
|
||||
POSTGRES_USER: postgres
|
||||
POSTGRES_PASSWORD: postgres
|
||||
POSTGRES_DB: postgres
|
||||
healthcheck:
|
||||
test: ["CMD", "pg_isready", "-U", "postgres"]
|
||||
interval: 2s
|
||||
timeout: 2s
|
||||
retries: 10
|
||||
|
||||
# Redis - caching + rate limiting on BE
|
||||
redis:
|
||||
image: redis
|
||||
restart: always
|
||||
profiles: ["frontend-dev", "backend-dev", "ci"]
|
||||
ports:
|
||||
- 6379:6379
|
||||
healthcheck:
|
||||
test: ["CMD-SHELL", "redis-cli ping | grep PONG"]
|
||||
interval: 2s
|
||||
timeout: 2s
|
||||
retries: 10
|
||||
command: redis-server /usr/local/etc/redis/redis.conf
|
||||
volumes:
|
||||
- ./redis.conf:/usr/local/etc/redis/redis.conf
|
||||
# insights host - redis:6379
|
||||
redis-insights:
|
||||
image: redislabs/redisinsight:latest
|
||||
profiles: ["backend-dev"]
|
||||
ports:
|
||||
- 8001:8001
|
||||
|
||||
# This DB is for Web Authentication and data caching.
|
||||
webdb:
|
||||
image: postgres
|
||||
restart: always
|
||||
profiles: ["frontend-dev", "ci", "inference-dev"]
|
||||
ports:
|
||||
- 5433:5432
|
||||
environment:
|
||||
POSTGRES_USER: postgres
|
||||
POSTGRES_PASSWORD: postgres
|
||||
POSTGRES_DB: oasst_web
|
||||
healthcheck:
|
||||
test: ["CMD", "pg_isready", "-U", "postgres"]
|
||||
interval: 2s
|
||||
timeout: 2s
|
||||
retries: 10
|
||||
|
||||
# This lets you manually inspect the web and backend databases.
|
||||
adminer:
|
||||
image: adminer
|
||||
restart: always
|
||||
profiles: ["frontend-dev", "backend-dev"]
|
||||
ports:
|
||||
- 8089:8080
|
||||
|
||||
# This fakes an SMTP email server used by website authentication.
|
||||
# User registration emails can be found by going to localhost:1080 and
|
||||
# opening the emails listed.
|
||||
maildev:
|
||||
image: maildev/maildev
|
||||
restart: always
|
||||
profiles: ["frontend-dev", "ci"]
|
||||
environment:
|
||||
- MAILDEV_WEB_PORT=1080
|
||||
- MAILDEV_SMTP_PORT=1025
|
||||
ports:
|
||||
- "1080:1080"
|
||||
- "1025:1025"
|
||||
|
||||
# The oassist backend service.
|
||||
backend:
|
||||
build:
|
||||
dockerfile: docker/Dockerfile.backend
|
||||
context: .
|
||||
image: oasst-backend
|
||||
environment:
|
||||
- POSTGRES_HOST=db
|
||||
- REDIS_HOST=redis
|
||||
- DEBUG_USE_SEED_DATA=True
|
||||
- DEBUG_ALLOW_SELF_LABELING=True
|
||||
- MAX_WORKERS=1
|
||||
- DEBUG_SKIP_TOXICITY_CALCULATION=False
|
||||
- DEBUG_SKIP_EMBEDDING_COMPUTATION=False
|
||||
- CELERY_BROKER_URL=redis://redis:6379/0
|
||||
- CELERY_RESULT_BACKEND=redis://redis:6379/0
|
||||
depends_on:
|
||||
db:
|
||||
condition: service_healthy
|
||||
profiles: ["frontend-dev", "ci", "inference-dev"]
|
||||
ports:
|
||||
- "8080:8080"
|
||||
|
||||
# The oassist backend celery worker service.
|
||||
backend-worker:
|
||||
build:
|
||||
dockerfile: docker/Dockerfile.backend-worker
|
||||
context: .
|
||||
command: celery -A oasst_backend.celery_worker worker -l info -E
|
||||
image: oasst-backend-worker
|
||||
environment:
|
||||
- CELERY_BROKER_URL=redis://redis:6379/0
|
||||
- CELERY_RESULT_BACKEND=redis://redis:6379/0
|
||||
- POSTGRES_HOST=db
|
||||
- REDIS_HOST=redis
|
||||
- MAX_WORKERS=1
|
||||
depends_on:
|
||||
db:
|
||||
condition: service_healthy
|
||||
redis:
|
||||
condition: service_healthy
|
||||
profiles: ["frontend-dev", "ci"]
|
||||
|
||||
# The oassist backend celery worker service.
|
||||
backend-worker-beat:
|
||||
build:
|
||||
dockerfile: docker/Dockerfile.backend-worker
|
||||
context: .
|
||||
command: celery -A oasst_backend.celery_worker beat -l INFO
|
||||
image: oasst-backend-worker-beat
|
||||
environment:
|
||||
- CELERY_BROKER_URL=redis://redis:6379/0
|
||||
- CELERY_RESULT_BACKEND=redis://redis:6379/0
|
||||
- POSTGRES_HOST=db
|
||||
- REDIS_HOST=redis
|
||||
- MAX_WORKERS=1
|
||||
depends_on:
|
||||
db:
|
||||
condition: service_healthy
|
||||
redis:
|
||||
condition: service_healthy
|
||||
profiles: ["frontend-dev", "ci"]
|
||||
|
||||
# The oassist web service.
|
||||
web:
|
||||
build:
|
||||
dockerfile: docker/Dockerfile.website
|
||||
context: .
|
||||
image: oasst-web
|
||||
environment:
|
||||
- CLOUDFLARE_CAPTCHA_SECRET_KEY=1x0000000000000000000000000000000AA
|
||||
- CLOUDFARE_CAPTCHA_SITE_KEY=1x00000000000000000000AA
|
||||
- DATABASE_URL=postgres://postgres:postgres@webdb/oasst_web
|
||||
- FASTAPI_URL=http://backend:8080
|
||||
- FASTAPI_KEY=1234
|
||||
- NEXTAUTH_SECRET=O/M2uIbGj+lDD2oyNa8ax4jEOJqCPJzO53UbWShmq98=
|
||||
- EMAIL_SERVER_HOST=maildev
|
||||
- EMAIL_SERVER_PORT=1025
|
||||
- EMAIL_FROM=info@example.com
|
||||
- ENABLE_EMAIL_SIGNIN=true
|
||||
- ENABLE_EMAIL_SIGNIN_CAPTCHA=false
|
||||
- NEXTAUTH_URL=http://localhost:3000
|
||||
- DEBUG_LOGIN=true
|
||||
- INFERENCE_SERVER_HOST=http://inference-server:8000
|
||||
- ENABLE_CHAT=true
|
||||
- ENABLE_DRAFTS_WITH_PLUGINS=false
|
||||
- NUM_GENERATED_DRAFTS=3
|
||||
depends_on:
|
||||
webdb:
|
||||
condition: service_healthy
|
||||
ports:
|
||||
- "3000:3000"
|
||||
command: bash wait-for-postgres.sh node server.js
|
||||
profiles: ["ci"]
|
||||
|
||||
# This DB is for Inference
|
||||
inference-db:
|
||||
image: postgres
|
||||
restart: always
|
||||
ports:
|
||||
- 5434:5432
|
||||
environment:
|
||||
POSTGRES_USER: postgres
|
||||
POSTGRES_PASSWORD: postgres
|
||||
POSTGRES_DB: oasst_inference
|
||||
healthcheck:
|
||||
test: ["CMD", "pg_isready", "-U", "postgres"]
|
||||
interval: 2s
|
||||
timeout: 2s
|
||||
retries: 10
|
||||
profiles: ["inference"]
|
||||
|
||||
inference-redis:
|
||||
image: redis
|
||||
restart: always
|
||||
profiles: ["inference"]
|
||||
ports:
|
||||
- 6389:6379
|
||||
healthcheck:
|
||||
test: ["CMD-SHELL", "redis-cli ping | grep PONG"]
|
||||
interval: 2s
|
||||
timeout: 2s
|
||||
retries: 10
|
||||
command: redis-server /usr/local/etc/redis/redis.conf
|
||||
volumes:
|
||||
- ./redis.conf:/usr/local/etc/redis/redis.conf
|
||||
|
||||
inference-server:
|
||||
build:
|
||||
dockerfile: docker/inference/Dockerfile.server
|
||||
context: .
|
||||
target: dev
|
||||
image: oasst-inference-server:dev
|
||||
environment:
|
||||
PORT: 8000
|
||||
REDIS_HOST: inference-redis
|
||||
POSTGRES_HOST: inference-db
|
||||
POSTGRES_DB: oasst_inference
|
||||
DEBUG_API_KEYS: "0000"
|
||||
TRUSTED_CLIENT_KEYS: "6969"
|
||||
ALLOW_DEBUG_AUTH: "True"
|
||||
API_ROOT: "http://localhost:8000"
|
||||
volumes:
|
||||
- "./oasst-shared:/opt/inference/lib/oasst-shared"
|
||||
- "./inference/server:/opt/inference/server"
|
||||
restart: unless-stopped
|
||||
ports:
|
||||
- "8000:8000"
|
||||
depends_on:
|
||||
inference-redis:
|
||||
condition: service_healthy
|
||||
inference-db:
|
||||
condition: service_healthy
|
||||
profiles: ["inference"]
|
||||
|
||||
inference-worker:
|
||||
build:
|
||||
dockerfile: docker/inference/Dockerfile.worker-full
|
||||
context: .
|
||||
image: oasst-inference-worker:dev
|
||||
environment:
|
||||
API_KEY: "0000"
|
||||
MODEL_CONFIG_NAME: ${MODEL_CONFIG_NAME:-distilgpt2}
|
||||
BACKEND_URL: "ws://inference-server:8000"
|
||||
PARALLELISM: 2
|
||||
volumes:
|
||||
- "./oasst-shared:/opt/inference/lib/oasst-shared"
|
||||
- "./inference/worker:/opt/inference/worker"
|
||||
deploy:
|
||||
replicas: 1
|
||||
profiles: ["inference"]
|
||||
|
||||
inference-safety:
|
||||
build:
|
||||
dockerfile: docker/inference/Dockerfile.safety
|
||||
context: .
|
||||
image: oasst-inference-safety:dev
|
||||
environment:
|
||||
PORT: 8002
|
||||
volumes:
|
||||
- "./oasst-shared:/opt/inference/lib/oasst-shared"
|
||||
- "./inference/safety:/opt/inference/safety"
|
||||
profiles: ["inference-safety"]
|
||||
|
||||
prometheus:
|
||||
image: prom/prometheus
|
||||
container_name: prometheus
|
||||
command:
|
||||
- "--config.file=/etc/prometheus/prometheus.yml"
|
||||
ports:
|
||||
- 9090:9090
|
||||
restart: unless-stopped
|
||||
volumes:
|
||||
- ${PWD}/docker/prometheus:/etc/prometheus
|
||||
- prom_data:/prometheus
|
||||
profiles: ["observability"]
|
||||
|
||||
grafana:
|
||||
image: grafana/grafana
|
||||
container_name: grafana
|
||||
ports:
|
||||
- 2000:2000
|
||||
restart: unless-stopped
|
||||
environment:
|
||||
- GF_SECURITY_ADMIN_USER=admin
|
||||
- GF_SECURITY_ADMIN_PASSWORD=grafana
|
||||
- GF_SERVER_HTTP_PORT=2000
|
||||
volumes:
|
||||
- ${PWD}/docker/grafana/datasources:/etc/grafana/provisioning/datasources
|
||||
- ${PWD}/docker/grafana/dashboards/dashboard.yaml:/etc/grafana/provisioning/dashboards/main.yaml
|
||||
- ${PWD}/docker/grafana/dashboards:/var/lib/grafana/dashboards
|
||||
profiles: ["observability"]
|
||||
|
||||
netdata:
|
||||
image: netdata/netdata
|
||||
container_name: netdata
|
||||
pid: host
|
||||
hostname: oasst-netdata
|
||||
ports:
|
||||
- 19999:19999
|
||||
restart: unless-stopped
|
||||
cap_add:
|
||||
- SYS_PTRACE
|
||||
- SYS_ADMIN
|
||||
security_opt:
|
||||
- apparmor:unconfined
|
||||
volumes:
|
||||
- netdataconfig:/etc/netdata
|
||||
- netdatalib:/var/lib/netdata
|
||||
- netdatacache:/var/cache/netdata
|
||||
- /etc/passwd:/host/etc/passwd:ro
|
||||
- /etc/group:/host/etc/group:ro
|
||||
- /proc:/host/proc:ro
|
||||
- /sys:/host/sys:ro
|
||||
- /etc/os-release:/host/etc/os-release:ro
|
||||
- /var/run/docker.sock:/var/run/docker.sock:ro
|
||||
- ${PWD}/docker/netdata/go.d/redis.conf:/etc/netdata/go.d/redis.conf
|
||||
- ${PWD}/docker/netdata/go.d/postgres.conf:/etc/netdata/go.d/postgres.conf
|
||||
- ${PWD}/docker/netdata/go.d/prometheus.conf:/etc/netdata/go.d/prometheus.conf
|
||||
environment:
|
||||
# useful if want to claim monitoring agents into https://www.netdata.cloud/
|
||||
# else ignore or leave blank to just use local netdata dashboards as localhost:19999
|
||||
- NETDATA_CLAIM_TOKEN=${NETDATA_CLAIM_TOKEN:-}
|
||||
- NETDATA_CLAIM_URL=https://app.netdata.cloud
|
||||
profiles: ["observability"]
|
||||
|
||||
volumes:
|
||||
prom_data:
|
||||
netdataconfig:
|
||||
netdatalib:
|
||||
netdatacache:
|
||||
Reference in New Issue
Block a user