51 lines
1.5 KiB
YAML
51 lines
1.5 KiB
YAML
x-defaults: &defaults
|
|
restart: unless-stopped
|
|
logging:
|
|
driver: json-file
|
|
options:
|
|
max-size: 100m
|
|
max-file: '3'
|
|
|
|
services:
|
|
pytorch:
|
|
<<: *defaults
|
|
image: ${GLOBAL_REGISTRY:-}pytorch/pytorch:${PYTORCH_VERSION:-2.6.0-cuda12.6-cudnn9-runtime}
|
|
ports:
|
|
- '${JUPYTER_PORT_OVERRIDE:-8888}:8888'
|
|
- '${TENSORBOARD_PORT_OVERRIDE:-6006}:6006'
|
|
environment:
|
|
TZ: ${TZ:-UTC}
|
|
NVIDIA_VISIBLE_DEVICES: ${NVIDIA_VISIBLE_DEVICES:-all}
|
|
NVIDIA_DRIVER_CAPABILITIES: ${NVIDIA_DRIVER_CAPABILITIES:-compute,utility}
|
|
JUPYTER_ENABLE_LAB: ${JUPYTER_ENABLE_LAB:-yes}
|
|
command: >
|
|
bash -c "pip install --no-cache-dir jupyter tensorboard &&
|
|
jupyter lab --ip=0.0.0.0 --port=8888 --no-browser --allow-root
|
|
--NotebookApp.token='${JUPYTER_TOKEN:-pytorch}'"
|
|
volumes:
|
|
- pytorch_notebooks:/workspace
|
|
- pytorch_data:/data
|
|
working_dir: /workspace
|
|
deploy:
|
|
resources:
|
|
limits:
|
|
cpus: ${PYTORCH_CPU_LIMIT:-4.0}
|
|
memory: ${PYTORCH_MEMORY_LIMIT:-16G}
|
|
reservations:
|
|
cpus: ${PYTORCH_CPU_RESERVATION:-2.0}
|
|
memory: ${PYTORCH_MEMORY_RESERVATION:-8G}
|
|
devices:
|
|
- driver: nvidia
|
|
count: ${GPU_COUNT:-1}
|
|
capabilities: [gpu]
|
|
healthcheck:
|
|
test: [CMD, wget, --no-verbose, --tries=1, --spider, 'http://localhost:8888/']
|
|
interval: 30s
|
|
timeout: 10s
|
|
retries: 3
|
|
start_period: 60s
|
|
|
|
volumes:
|
|
pytorch_notebooks:
|
|
pytorch_data:
|