Add `--max_steps 62` to the deepspeed launch arguments in train_mm_zero3_lora.sh.

The added line ends with a backslash so that the following `--deepspeed ...`
and `--report_to ...` lines remain arguments of the same deepspeed command
instead of being executed by the shell as a separate command.

NOTE(review): the leading whitespace of the hunk lines below was reconstructed;
confirm it matches the target file (or apply with `git apply --ignore-whitespace`).
The blob hashes on the `index` line predate the added backslash.

diff --git a/train_mm_zero3_lora.sh b/train_mm_zero3_lora.sh
index aad88e6..2863764 100755
--- a/train_mm_zero3_lora.sh
+++ b/train_mm_zero3_lora.sh
@@ -11,5 +11,6 @@ FORCE_COLOR=1 deepspeed --hostfile hostfile \
     --learning_rate 1e-4 \
     --warmup_ratio 0.03 \
     --lora_r 16 --lora_alpha 32 --lora_dropout 0.05 \
+    --max_steps 62 \
     --deepspeed /home/test/jd_train/ds_config_zero3_lora.json \
     --report_to wandb --wandb_project ds-qwen3-lora