version: '3.8' services: ubuntu-evo: build: context: . dockerfile: Dockerfile args: # PyTorch版本、Python版本与pytorch_lightning版本的对应关系表 https://blog.csdn.net/qq_41813454/article/details/137421822 CONDA_ENV_NAME: evo CUDA_VERSION: 11.7.1 PYTORCH_VERSION: 1.13.1 TORCHVISION_VERSION: 0.14.1 TORCHAUDIO_VERSION: 0.13.1 DS_BUILD_OPS: 1 DS_BUILD_SPARSE_ATTN: 0 DS_BUILD_FUSED_ADAM: 0 DS_BUILD_CPU_ADAM: 0 CUDA: cu117 CUDA_ARCH_LIST: "80;86;89;90" # for RTX 4090, all : "80;86;89;90" SETUPTOOLS_VERSION: "69.5.1" ROOT_PASSWD: "root" volumes: - ./src:/bbtft container_name: ubuntu-evo pull_policy: if_not_present tty: true restart: unless-stopped image: hotwa/deepspeed:test shm_size: '32gb' ports: - 3227:2222 command: ["/usr/sbin/sshd", "-D"] environment: - NVIDIA_VISIBLE_DEVICES=all - NVIDIA_DRIVER_CAPABILITIES=compute,utility networks: - network_evo deploy: resources: reservations: devices: - driver: nvidia count: all capabilities: [gpu] networks: network_evo: name: network_evo