This commit is contained in:
2024-06-21 15:12:44 +08:00
parent 5c6e2f44e5
commit be77975ce2
7 changed files with 20 additions and 900 deletions

View File

@@ -317,7 +317,7 @@ cd ..
EOT
# Build arguments for the DeepSpeed installation. Each ARG supplies a default
# that can be overridden at build time, and the matching ENV copies the value
# into the image environment.
# CUDA_ARCH_LIST="80;86;89;90"
# NOTE(review): DEEPSPEED_VERSION is declared twice below with different
# defaults. This text looks like a rendered diff, so "0.8.3" is presumably the
# replaced value and "0.14.3" the new one -- confirm that only one declaration
# exists in the real Dockerfile.
ARG DEEPSPEED_VERSION="0.8.3"
ARG DEEPSPEED_VERSION="0.14.3"
ENV DEEPSPEED_VERSION=${DEEPSPEED_VERSION}
# Extra flags for the DeepSpeed install; presumably consumed by an install
# command outside this excerpt -- TODO confirm where they are used.
ARG DEEPSPEED_INSTALL_FLAGS="--allow_sudo --pip_sudo --no_clean"
ENV DEEPSPEED_INSTALL_FLAGS=${DEEPSPEED_INSTALL_FLAGS}
@@ -339,7 +339,7 @@ source /opt/conda/etc/profile.d/conda.sh
conda activate ${CONDA_ENV_NAME}
python -m pip install setuptools==${SETUPTOOLS_VERSION}
# install oneapi for deepspeed
git clone https://github.com/oneapi-src/oneCCL.git ${STAGE_DIR}/oneCCL
git clone https://ghproxy.dockless.eu.org/https://github.com/oneapi-src/oneCCL.git ${STAGE_DIR}/oneCCL
cd ${STAGE_DIR}/oneCCL
git checkout .
git checkout master
@@ -347,15 +347,27 @@ mkdir build
cd build
cmake .. -DCMAKE_INSTALL_PREFIX=/usr/local
make -j"$(nproc)" install
git clone https://github.com/microsoft/DeepSpeed-Kernels.git ${STAGE_DIR}/DeepSpeed-Kernels
EOT
# Build the DeepSpeed-Kernels wheel inside the conda environment and install it.
# NOTE(review): the script below does not enable "set -e", so a failing command
# does not stop the remaining commands from running -- confirm this is intended.
RUN <<EOT
#!/bin/bash
# Load conda's shell integration, then switch to the target environment.
source /opt/conda/etc/profile.d/conda.sh
conda activate ${CONDA_ENV_NAME}
# The repository is fetched through the ghproxy.dockless.eu.org URL prefix
# instead of github.com directly.
git clone https://ghproxy.dockless.eu.org/https://github.com/microsoft/DeepSpeed-Kernels.git ${STAGE_DIR}/DeepSpeed-Kernels
cd ${STAGE_DIR}/DeepSpeed-Kernels
# CUDA_ARCH_LIST is handed to the wheel build as an environment variable.
CUDA_ARCH_LIST=${CUDA_ARCH_LIST} python setup.py bdist_wheel
# Install the wheel that the previous command wrote to dist/.
pip install dist/deepspeed_kernels-*.whl
# Alternative kept for reference: install straight from the source tree.
# CUDA_ARCH_LIST=${CUDA_ARCH_LIST} pip install -v .
# NOTE(review): this clone goes to github.com directly, unlike the proxied clone
# above, and nothing else in this RUN step uses ${STAGE_DIR}/DeepSpeed. It looks
# like the pre-change line of a diff view -- confirm whether it belongs here.
git clone https://github.com/microsoft/DeepSpeed.git ${STAGE_DIR}/DeepSpeed
EOT
RUN <<EOT
#!/bin/bash
source /opt/conda/etc/profile.d/conda.sh
conda activate ${CONDA_ENV_NAME}
git clone https://ghproxy.dockless.eu.org/https://github.com/microsoft/DeepSpeed.git ${STAGE_DIR}/DeepSpeed
cd ${STAGE_DIR}/DeepSpeed
git checkout .
git checkout v0.8.3
# git checkout v${DEEPSPEED_VERSION}
python setup.py bdist_wheel
DS_BUILD_OPS=${DS_BUILD_OPS} pip install dist/deepspeed*.whl --force-reinstall
# DS_BUILD_OPS=${DS_BUILD_OPS} pip install -r requirements/requirements.txt