From 603b23dab0a65e9db2487dfdbf10f3c4e175daee Mon Sep 17 00:00:00 2001 From: hailin Date: Mon, 1 Sep 2025 18:36:35 +0800 Subject: [PATCH] . --- train_sft_ds.py | 1 + 1 file changed, 1 insertion(+) diff --git a/train_sft_ds.py b/train_sft_ds.py index ee0f055..5038b91 100644 --- a/train_sft_ds.py +++ b/train_sft_ds.py @@ -847,6 +847,7 @@ def main(): logging_steps=args.log_interval, save_steps=args.save_steps, save_total_limit=2, + optim="adamw_torch", # deepspeed=(args.deepspeed if args.deepspeed and os.path.isfile(args.deepspeed) else None), deepspeed=(args.deepspeed if use_ds else None), dataloader_drop_last=False,