This commit is contained in:
hailin 2025-08-08 21:43:40 +08:00
parent 4060a7237c
commit af4cc28de2
1 changed files with 23 additions and 18 deletions

View File

@@ -173,32 +173,37 @@ log "Build & install DeepSpeed"
cd "${REPO_PATH}" cd "${REPO_PATH}"
pip uninstall -y deepspeed >/dev/null 2>&1 || true pip uninstall -y deepspeed >/dev/null 2>&1 || true
rm -rf build rm -rf build
# —— 编译前置(强烈建议)——
python - <<'PY'
import sys, subprocess
subprocess.check_call([sys.executable, "-m", "pip", "install", "-U", "pip", "setuptools", "wheel", "ninja"])
PY
# 并行编译提速(按 CPU 核心数调)
export MAX_JOBS=${MAX_JOBS:-$(nproc)}
# —— DeepSpeed 功能开关 ——
# 编译核心 CUDA/C++ 扩展(必须)
export DS_BUILD_OPS=1 export DS_BUILD_OPS=1
export DS_BUILD_AIO=1
export DS_BUILD_FUSED_ADAM=1
export DS_BUILD_CPU_ADAM=1
export DS_BUILD_EVOFORMER_ATTN=0
export DS_BUILD_AIO=1 # 训练常用加速内核
export DS_BUILD_TRANSFORMER=1
export DS_BUILD_SPARSE_ATTN=1
export DS_BUILD_FLASH_ATTN=1
# 常用优化器(强烈建议开)
export DS_BUILD_FUSED_ADAM=1 export DS_BUILD_FUSED_ADAM=1
export DS_BUILD_CPU_ADAM=1 export DS_BUILD_CPU_ADAM=1
# 全部关掉和推理/transformer/CUTLASS/flash/sparse 有关的东西 # 可选:异步 IO,Linux 才生效,Windows 不支持 AIO/GDS
export DS_BUILD_EVOFORMER_ATTN=0 export DS_BUILD_AIO=1
export DS_BUILD_INFERENCE=0
export DS_BUILD_TRANSFORMER=0
export DS_BUILD_SPARSE_ATTN=0
export DS_BUILD_SDP_ATTN=0
export DS_BUILD_FLASH_ATTN=0
export DS_BUILD_QKV_GEMM=0
export DS_BUILD_CUTLASS=0
unset CUTLASS_PATH
# 如需推理内核:export DS_BUILD_TRANSFORMER=1 # 安装(带详细日志)
# 提供更详细日志便于排错
pip install -v . pip install -v .
# ============================= # =============================
# 7. 验证安装 # 7. 验证安装
# ============================= # =============================