This commit is contained in:
2024-07-15 13:00:45 +08:00
parent ae03ae6b7b
commit 0c6a664069

View File

@@ -4,6 +4,9 @@ services:
build: build:
context: . context: .
dockerfile: Dockerfile.ldh dockerfile: Dockerfile.ldh
args:
HTTP_PROXY: "http://127.0.0.1:15777"
HTTPS_PROXY: "http://127.0.0.1:15777"
image: ldh/deepspeed:test image: ldh/deepspeed:test
shm_size: '32gb' shm_size: '32gb'
deploy: deploy:
@@ -13,28 +16,30 @@ services:
- driver: nvidia - driver: nvidia
count: all count: all
capabilities: [gpu] capabilities: [gpu]
runtime: nvidia #runtime: nvidia
environment: environment:
- NVIDIA_VISIBLE_DEVICES=all - NVIDIA_VISIBLE_DEVICES=all
- NVIDIA_DRIVER_CAPABILITIES=compute,utility - NVIDIA_DRIVER_CAPABILITIES=compute,utility
#- CUTLASS_PATH="/opt/cutlass"
#- CUDA_HOME="/usr/local/cuda"
#- PATH="${CUDA_HOME}/bin:${PATH}"
#- LD_LIBRARY_PATH="${CUDA_HOME}/lib64:${LD_LIBRARY_PATH}"
stdin_open: true stdin_open: true
tty: true tty: true
privileged: true privileged: true
cap_add: cap_add:
- IPC_LOCK - IPC_LOCK
devices:
- /dev/infiniband:/dev/infiniband
volumes: volumes:
- /mnt/local-nvme2:/root/data/local-nvme2 # - /mnt/local-nvme2:/root/workspace
- /mnt/local-nvme:/root/data/local-nvme # - /dev/infiniband:/dev/infiniband
# ports: # - /mnt/local-nvme:/root/
# - "22242:22242" ports:
# - "5000:5000" - "22242:22242"
- "5000:5000"
# networks: # networks:
# - ldh_overlay_network # - ldh_overlay_network
network_mode: host network_mode: host
# command: ["/usr/sbin/sshd", "-D"] command: ["/usr/sbin/sshd", "-D"]
# command: ["/usr/sbin/sshd"]
# networks: # networks:
# ldh_overlay_network: # ldh_overlay_network: