update
This commit is contained in:
26
finetune/docker-compose_nccl.yml
Normal file
26
finetune/docker-compose_nccl.yml
Normal file
@@ -0,0 +1,26 @@
|
|||||||
|
# Docker Compose definition for a single GPU container used to run NCCL tests.
# Image source and usage notes:
# https://github.com/mayooot/build-nccl-tests-with-pytorch
version: '3.8'

services:
  nccl-test-container:
    image: mayooot/nccl-tests-with-pytorch:v0.0.2
    container_name: nccl-test-container
    # Use the host's network stack directly (no bridge network / port mapping).
    network_mode: host
    environment:
      # PORT and PASS are read by the image at startup.
      # NOTE(review): presumably the SSH listen port and login password of the
      # container -- confirm against the upstream README linked above.
      # Both values can be overridden from the shell or an .env file via
      # NCCL_TEST_PORT / NCCL_TEST_PASS; the defaults are the previously
      # hard-coded values, so behaviour is unchanged when nothing is set.
      # Override NCCL_TEST_PASS on any shared machine: the default is public.
      - 'PORT=${NCCL_TEST_PORT:-1998}'
      - 'PASS=${NCCL_TEST_PASS:-P@88w0rd}'
    volumes:
      # Key pair mounted into root's SSH directory inside the container.
      # NOTE(review): the private key file is named id_rsa_finetune while the
      # public key file is id_rsa.pub -- verify they belong to the same pair.
      - ./id_rsa_finetune:/root/.ssh/id_rsa
      - ./id_rsa.pub:/root/.ssh/id_rsa.pub
    deploy:
      resources:
        reservations:
          devices:
            # Reserve every NVIDIA GPU on the host for this container.
            - driver: nvidia
              count: all
              capabilities: [gpu]
    cap_add:
      # Grants CAP_IPC_LOCK (memory locking); presumably required for
      # RDMA/InfiniBand memory registration -- TODO confirm.
      - IPC_LOCK
    devices:
      # Expose the host's InfiniBand device nodes inside the container.
      - /dev/infiniband:/dev/infiniband
    shm_size: '32gb'
    restart: unless-stopped
|
||||||
Reference in New Issue
Block a user