-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathdocker-compose.gpu.yml
More file actions
33 lines (31 loc) · 944 Bytes
/
docker-compose.gpu.yml
File metadata and controls
33 lines (31 loc) · 944 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
# Compose file format version; quoted so it is read as a string, not the float 3.9.
# NOTE(review): Compose v2 treats the top-level `version` key as informational only — confirm whether it is still needed.
version: '3.9'
# GPU override for genome-model-service with evo2_40b.
# Usage: docker compose -f docker-compose.yml -f docker-compose.gpu.yml up --build
#
# Requirements:
# - NVIDIA driver ≥ 550 (CUDA 12.4+)
# - nvidia-container-toolkit installed
# - 2× GPUs with ≥ 80 GB VRAM each (e.g. H100/A100 80GB) for evo2_40b
# - Set HUGGINGFACE_TOKEN in .env if the model repository is gated
#
# To run evo2_7b instead (single A100/H100 with 40 GB+ VRAM):
#   set EVO2_MODEL_NAME to evo2_7b
# GPU overrides for genome-model-service. When this file is passed after the
# base docker-compose.yml (see the usage line in the header), these keys are
# merged onto the service of the same name.
services:
  genome-model-service:
    # Build the image from the GPU-specific Dockerfile in the service directory.
    build:
      context: ./apps/genome-model-service
      dockerfile: Dockerfile.gpu
    # Reserve NVIDIA GPU devices for the container.
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: all  # reserve every GPU available on the host
              capabilities: [gpu]
    # Model selection passed to the service as environment variables.
    environment:
      EVO2_PROVIDER: local
      EVO2_MODEL_NAME: evo2_40b
      EVO2_DEVICE: 'cuda:0'
    # Named volumes mounted over the cache directories under /root/.cache.
    # NOTE(review): evo2-model-cache and hf-model-cache are not declared in the
    # visible part of this file — confirm the base docker-compose.yml declares
    # them under its top-level `volumes:` key.
    volumes:
      - evo2-model-cache:/root/.cache/evo2
      - hf-model-cache:/root/.cache/huggingface