This commit is contained in:
hailin 2025-09-01 20:41:39 +08:00
parent b8fb783871
commit 123a49db1b
1 changed file with 3 additions and 1 deletion

View File

@@ -4,7 +4,9 @@ export TORCH_EXTENSIONS_DIR=/tmp/$USER/torch_ext
 export PYTORCH_CUDA_ALLOC_CONF="max_split_size_mb:128,expandable_segments:True,garbage_collection_threshold:0.9"
-export PYTORCH_CUDA_ALLOC_CONF="max_split_size_mb:64"
+export OMP_NUM_THREADS=8
+export MKL_NUM_THREADS=8
+export OPENBLAS_NUM_THREADS=8
 deepspeed --hostfile hostfile \
 --num_nodes 6 --num_gpus 4 \