27 lines
673 B
YAML
27 lines
673 B
YAML
services:
|
|
app:
|
|
build: .
|
|
image: open-llama-image
|
|
container_name: open-llama-container
|
|
volumes:
|
|
- .:/app
|
|
#runtime: nvidia
|
|
deploy:
|
|
resources:
|
|
limits:
|
|
memory: 20G
|
|
reservations:
|
|
devices:
|
|
- driver: nvidia
|
|
count: all
|
|
capabilities: [gpu]
|
|
memory: 20G
|
|
memswap_limit: 60G
|
|
environment:
|
|
- NVIDIA_VISIBLE_DEVICES=all
|
|
- NVIDIA_DRIVER_CAPABILITIES=compute,utility
|
|
- CUDA_DEVICE_ORDER=PCI_BUS_ID
|
|
- CUDA_VISIBLE_DEVICES=0
|
|
- CUDA_LAUNCH_BLOCKING=1
|
|
- TORCH_USE_CUDA_DSA=1
|
|
- PYTORCH_CUDA_ALLOC_CONF=max_split_size_mb:256 |