update
This commit is contained in:
@@ -20,7 +20,7 @@ services:
|
|||||||
ubuntu-finetune:
|
ubuntu-finetune:
|
||||||
build:
|
build:
|
||||||
context: .
|
context: .
|
||||||
dockerfile: Dockerfile.update
|
dockerfile: Dockerfile.zly
|
||||||
args: # PyTorch版本、Python版本与pytorch_lightning版本的对应关系表 https://blog.csdn.net/qq_41813454/article/details/137421822
|
args: # PyTorch版本、Python版本与pytorch_lightning版本的对应关系表 https://blog.csdn.net/qq_41813454/article/details/137421822
|
||||||
PYTHON_VERSION: "3.10"
|
PYTHON_VERSION: "3.10"
|
||||||
GO_VERSION: "1.21.13"
|
GO_VERSION: "1.21.13"
|
||||||
@@ -34,8 +34,8 @@ services:
|
|||||||
USE_ROCM: 0
|
USE_ROCM: 0
|
||||||
USE_XPU: 0
|
USE_XPU: 0
|
||||||
CUDA: "cu121"
|
CUDA: "cu121"
|
||||||
CUDA_ARCH_LIST: "80;90" # for RTX 4090, all : "80;86;89;90"
|
CUDA_ARCH_LIST: "80;89;90" # for RTX 4090, all : "80;86;89;90"
|
||||||
TORCH_CUDA_ARCH_LIST: "8.0;9.0+PTX" # all "6.0;6.1;6.2;7.0;7.5;8.0;8.6;8.9;9.0"
|
TORCH_CUDA_ARCH_LIST: "8.0;8.9;9.0+PTX" # all "6.0;6.1;6.2;7.0;7.5;8.0;8.6;8.9;9.0"
|
||||||
SETUPTOOLS_VERSION: "69.5.1"
|
SETUPTOOLS_VERSION: "69.5.1"
|
||||||
# Hopper (H100): 90a
|
# Hopper (H100): 90a
|
||||||
# Ampere (A100, RTX 30 series): 80
|
# Ampere (A100, RTX 30 series): 80
|
||||||
@@ -43,7 +43,7 @@ services:
|
|||||||
# Volta (V100): 70
|
# Volta (V100): 70
|
||||||
# Pascal (P100, GTX 10 series): 60;61
|
# Pascal (P100, GTX 10 series): 60;61
|
||||||
# Maxwell (GTX 900 series): 50;53
|
# Maxwell (GTX 900 series): 50;53
|
||||||
DCUTLASS_NVCC_ARCHS: "80;90a" # 90a for H100 GPU 89:GeForce RTX 4090
|
DCUTLASS_NVCC_ARCHS: "80;89;90a" # 90a: H100 GPU; 89: GeForce RTX 4090
|
||||||
DEEPSPEED_VERSION: "master"
|
DEEPSPEED_VERSION: "master"
|
||||||
DEEPSPEED_INSTALL_FLAGS: "--allow_sudo"
|
DEEPSPEED_INSTALL_FLAGS: "--allow_sudo"
|
||||||
# HTTP_PROXY: "http://127.0.0.1:15777"
|
# HTTP_PROXY: "http://127.0.0.1:15777"
|
||||||
@@ -69,18 +69,18 @@ services:
|
|||||||
cap_add:
|
cap_add:
|
||||||
- ALL
|
- ALL
|
||||||
- CAP_SYS_PTRACE
|
- CAP_SYS_PTRACE
|
||||||
shm_size: '63gb'
|
shm_size: '32gb'
|
||||||
devices:
|
# devices:
|
||||||
- /dev/infiniband/rdma_cm
|
# - /dev/infiniband/rdma_cm
|
||||||
- /dev/infiniband/uverbs0
|
# - /dev/infiniband/uverbs0
|
||||||
- /dev/infiniband/uverbs1
|
# - /dev/infiniband/uverbs1
|
||||||
- /dev/infiniband/uverbs2
|
# - /dev/infiniband/uverbs2
|
||||||
- /dev/infiniband/uverbs3
|
# - /dev/infiniband/uverbs3
|
||||||
- /dev/infiniband/uverbs4
|
# - /dev/infiniband/uverbs4
|
||||||
- /dev/infiniband/uverbs5
|
# - /dev/infiniband/uverbs5
|
||||||
- /dev/infiniband/uverbs6
|
# - /dev/infiniband/uverbs6
|
||||||
- /dev/infiniband/uverbs7
|
# - /dev/infiniband/uverbs7
|
||||||
- /dev/infiniband/uverbs8
|
# - /dev/infiniband/uverbs8
|
||||||
ipc: host
|
ipc: host
|
||||||
# ports:
|
# ports:
|
||||||
# - 3228:2222
|
# - 3228:2222
|
||||||
|
|||||||
Reference in New Issue
Block a user