From d129562a4342e506f40a0d25da94aa1e64278ef7 Mon Sep 17 00:00:00 2001
From: hailin
Date: Tue, 9 Sep 2025 19:20:56 +0800
Subject: [PATCH] .

---
 train_mm_zero3_lora.sh | 1 +
 1 file changed, 1 insertion(+)

diff --git a/train_mm_zero3_lora.sh b/train_mm_zero3_lora.sh
index 7492b73..2770e0c 100755
--- a/train_mm_zero3_lora.sh
+++ b/train_mm_zero3_lora.sh
@@ -12,5 +12,6 @@ FORCE_COLOR=1 deepspeed --hostfile hostfile \
  --warmup_ratio 0.03 \
  --lora_r 16 --lora_alpha 32 --lora_dropout 0.05 \
  --max_steps 62 \
+ --gradient_checkpointing \
  --deepspeed /home/test/jd_train/ds_config_zero3_lora.json \
  --report_to wandb --wandb_project ds-qwen3-lora