diff --git a/finetune/Dockerfile.update b/finetune/Dockerfile.update index e47103e..52eb7a1 100644 --- a/finetune/Dockerfile.update +++ b/finetune/Dockerfile.update @@ -366,43 +366,6 @@ else fi eval $INSTALL_CMD # compile deepspeed ops -cat <<'EOF' >> ~/.bashrc -source ~/micromamba/etc/profile.d/micromamba.sh -echo "alias mamba=micromamba" >> ~/.bashrc -echo "alias mba=mamba" >> ~/.bashrc -EOF -# 配置 .mambarc 文件 -cat <<EOF > ~/compile_deepspeed_ops.py -import deepspeed - -def compile_ops(): - builders = [ - deepspeed.ops.op_builder.AsyncIOBuilder, - deepspeed.ops.op_builder.FusedAdamBuilder, - deepspeed.ops.op_builder.CPUAdamBuilder, - deepspeed.ops.op_builder.CPUAdagradBuilder, - deepspeed.ops.op_builder.CPULionBuilder, - deepspeed.ops.op_builder.EvoformerAttnBuilder, - deepspeed.ops.op_builder.FPQuantizerBuilder, - deepspeed.ops.op_builder.FusedLambBuilder, - deepspeed.ops.op_builder.FusedLionBuilder, - deepspeed.ops.op_builder.QuantizerBuilder, - deepspeed.ops.op_builder.RaggedOpsBuilder, - deepspeed.ops.op_builder.RandomLTDBuilder, - deepspeed.ops.op_builder.SparseAttnBuilder, - deepspeed.ops.op_builder.SpatialInferenceBuilder, - deepspeed.ops.op_builder.TransformerBuilder, - deepspeed.ops.op_builder.StochasticTransformerBuilder, - ] - - for builder in builders: - print(f"Compiling {builder.__name__}") - builder().load() - -if __name__ == "__main__": - compile_ops() -EOF -python compile_deepspeed_ops.py ds_report # clean up # rm -f deepspeed/git_version_info_installed.py diff --git a/finetune/README.md b/finetune/README.md index ec3ad7f..d5dfb35 100644 --- a/finetune/README.md +++ b/finetune/README.md @@ -24,6 +24,40 @@ mst version mpirun --version ``` +```shell +cat <<EOF > ~/compile_deepspeed_ops.py +import deepspeed + +def compile_ops(): + builders = [ + deepspeed.ops.op_builder.AsyncIOBuilder, + deepspeed.ops.op_builder.FusedAdamBuilder, + deepspeed.ops.op_builder.CPUAdamBuilder, + deepspeed.ops.op_builder.CPUAdagradBuilder, + deepspeed.ops.op_builder.CPULionBuilder, + 
deepspeed.ops.op_builder.EvoformerAttnBuilder, + deepspeed.ops.op_builder.FPQuantizerBuilder, + deepspeed.ops.op_builder.FusedLambBuilder, + deepspeed.ops.op_builder.FusedLionBuilder, + deepspeed.ops.op_builder.QuantizerBuilder, + deepspeed.ops.op_builder.RaggedOpsBuilder, + deepspeed.ops.op_builder.RandomLTDBuilder, + deepspeed.ops.op_builder.SparseAttnBuilder, + deepspeed.ops.op_builder.SpatialInferenceBuilder, + deepspeed.ops.op_builder.TransformerBuilder, + deepspeed.ops.op_builder.StochasticTransformerBuilder, + ] + + for builder in builders: + print(f"Compiling {builder.__name__}") + builder().load() + +if __name__ == "__main__": + compile_ops() +EOF +python ~/compile_deepspeed_ops.py +``` + ## 物理机更新内核 ```shell