first add

This commit is contained in:
Your Name
2024-08-02 14:44:39 +08:00
parent 0b0edc3755
commit 968bc3dd24
35 changed files with 3693 additions and 65 deletions

35
docker-compose_m_d.yml Normal file
View File

@@ -0,0 +1,35 @@
# Compose definition for a single GPU container that runs an SSH daemon in the
# foreground. Indentation follows the Compose schema: everything below the
# service name is a property of that service.
services:
  ldh-megatron-deepspeed-test:
    image: hotwa/magadeep:latest
    # Size of /dev/shm inside the container.
    shm_size: '128gb'

    # Reserve every NVIDIA GPU on the host for this service.
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: all
              capabilities: [gpu]
    # Legacy alternative to the device reservation above (disabled).
    # runtime: nvidia

    environment:
      - NVIDIA_VISIBLE_DEVICES=all
      - NVIDIA_DRIVER_CAPABILITIES=compute,utility

    # stdin_open: true
    # tty: true

    # NOTE(review): privileged mode already grants the container all
    # capabilities, so the explicit IPC_LOCK below looks redundant - confirm
    # whether privileged is really required or IPC_LOCK alone would suffice.
    privileged: true
    cap_add:
      - IPC_LOCK

    volumes:
      # Host workspace, visible in the container as /root/data.
      - /root/workspace:/root/data
      # Host InfiniBand device directory, bind-mounted at the same path.
      - /dev/infiniband:/dev/infiniband

    # Port publishing and the overlay network are disabled because the
    # service uses the host network stack directly (see network_mode).
    # ports:
    #   - "22242:22242"
    #   - "5000:5000"
    # networks:
    #   - ldh_overlay_network
    network_mode: host

    # Keep sshd in the foreground (-D) so it stays the container's main process.
    command: ["/usr/sbin/sshd", "-D"]

# Top-level declaration for the external overlay network (disabled together
# with the service-level `networks` entry above).
# networks:
#   ldh_overlay_network:
#     external: true