add docker swarm network

This commit is contained in:
Your Name
2024-06-29 06:17:20 +00:00
parent f074dcd44e
commit c6af21a957
2 changed files with 53 additions and 1 deletions

4
.gitignore vendored
View File

@@ -3,4 +3,6 @@ build_d/
*_src
evo_src/
megaDNA_src/
evo/huggingface/
evo/huggingface/
*.zip
finetune/binbbt/

View File

@@ -0,0 +1,50 @@
# Compose definition for the GPU fine-tuning container.
version: '3.8'

services:
  ubuntu-finetune:
    build:
      context: .
      dockerfile: Dockerfile
      # Build args reach the Dockerfile as strings; every scalar is quoted so
      # that YAML cannot retype it (e.g. 3.10 -> 3.1).
      args:
        PYTHON_VERSION: "3.10"
        CUDA_VERSION: "12.1.0"
        PYTORCH_VERSION: "2.3.0"
        TORCHVISION_VERSION: "0.18.0"
        TORCHAUDIO_VERSION: "2.3.0"
        DS_BUILD_OPS: "1"
        USE_CUDA: "1"
        USE_ROCM: "0"
        USE_XPU: "0"
        CUDA: "cu121"
        CUDA_ARCH_LIST: "80;86;89;90"
        SETUPTOOLS_VERSION: "69.5.1"
        DCUTLASS_NVCC_ARCHS: "80;86;89;90;90a"
        DEEPSPEED_VERSION: "master"
        DEEPSPEED_INSTALL_FLAGS: "--allow_sudo"
    volumes:
      # Host directory ./binbbt is mounted at /bbtft inside the container.
      - ./binbbt:/bbtft
    container_name: ubuntu-finetune
    pull_policy: if_not_present
    restart: unless-stopped
    image: hotwa/deepspeed:pt23
    shm_size: '40gb'
    ports:
      # Host port 3228 -> container port 22 (presumably SSH; confirm against
      # the Dockerfile). Quoted because an unquoted xx:yy value can be parsed
      # as a base-60 integer by YAML 1.1 loaders.
      - "3228:22"
    environment:
      - NVIDIA_VISIBLE_DEVICES=all
      - NVIDIA_DRIVER_CAPABILITIES=compute,utility
      - TMPDIR=/var/tmp
    networks:
      # Must match a key declared under the top-level `networks` section.
      - network_finetune
    deploy:
      resources:
        reservations:
          devices:
            # Reserve every NVIDIA GPU device for this service.
            - driver: nvidia
              count: all
              capabilities: [gpu]

# Switched to the Docker Swarm network.
# The service refers to this network as `network_finetune`; `name` points it
# at the pre-existing external network `test-net`, which Compose will not
# create and expects to already exist.
networks:
  network_finetune:
    name: test-net
    external: true