diff --git a/train_mm_zero3_lora.sh b/train_mm_zero3_lora.sh index 2863764..eaeeda5 100755 --- a/train_mm_zero3_lora.sh +++ b/train_mm_zero3_lora.sh @@ -11,6 +11,6 @@ FORCE_COLOR=1 deepspeed --hostfile hostfile \ --learning_rate 1e-4 \ --warmup_ratio 0.03 \ --lora_r 16 --lora_alpha 32 --lora_dropout 0.05 \ - --max_steps 62 + --max_steps 62 \ --deepspeed /home/test/jd_train/ds_config_zero3_lora.json \ --report_to wandb --wandb_project ds-qwen3-lora