---
# Compose definition for the `ldh-deepspeed-test` service.
# Builds the image from Dockerfile.ldh, reserves every NVIDIA GPU on the host,
# and keeps the container alive by running sshd in the foreground.
services:
  ldh-deepspeed-test:
    build:
      context: .
      dockerfile: Dockerfile.ldh
      args:
        # NOTE(review): 127.0.0.1 is resolved inside the build environment;
        # confirm the proxy is actually reachable there during `build`.
        HTTP_PROXY: "http://127.0.0.1:15777"
        HTTPS_PROXY: "http://127.0.0.1:15777"
    image: ldh/deepspeed:test
    shm_size: '32gb'

    # Reserve all NVIDIA GPUs for this service.
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: all
              capabilities: [gpu]
    # runtime: nvidia

    environment:
      - NVIDIA_VISIBLE_DEVICES=all
      - NVIDIA_DRIVER_CAPABILITIES=compute,utility
      # - CUTLASS_PATH="/opt/cutlass"
      # - CUDA_HOME="/usr/local/cuda"
      # - PATH="${CUDA_HOME}/bin:${PATH}"
      # - LD_LIBRARY_PATH="${CUDA_HOME}/lib64:${LD_LIBRARY_PATH}"

    stdin_open: true
    tty: true

    privileged: true
    # NOTE(review): `privileged: true` presumably already grants IPC_LOCK,
    # making this entry redundant; kept as-is pending confirmation.
    cap_add:
      - IPC_LOCK

    # No bind mounts are active. An explicit empty list is used instead of a
    # bare `volumes:` key, which would evaluate to null rather than a list.
    volumes: []
    # Previously considered mounts:
    #   - /mnt/local-nvme2:/root/workspace
    #   - /dev/infiniband:/dev/infiniband
    #   - /mnt/local-nvme:/root/

    # The container shares the host network stack, so its listening ports are
    # reachable on the host directly. Port mappings must not be combined with
    # `network_mode: host`, so the former mappings are kept only as a record:
    # ports:
    #   - "22242:22242"
    #   - "5000:5000"
    # networks:
    #   - ldh_overlay_network
    network_mode: host

    # Run the SSH daemon in the foreground (-D) as the container's main process.
    command: ["/usr/sbin/sshd", "-D"]

# networks:
#   ldh_overlay_network:
#     external: true