From 619bebcf57edeebffbbe99420fe195bf3bc50162 Mon Sep 17 00:00:00 2001 From: hailin Date: Tue, 26 Aug 2025 20:02:49 +0800 Subject: [PATCH] . --- train_sft_ds.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/train_sft_ds.py b/train_sft_ds.py index c1a4500..8ec18b9 100644 --- a/train_sft_ds.py +++ b/train_sft_ds.py @@ -634,7 +634,9 @@ def main(): save_steps=args.save_steps, save_total_limit=2, deepspeed=(args.deepspeed if args.deepspeed and os.path.isfile(args.deepspeed) else None), - dataloader_drop_last=False, # 关键:别丢尾,避免空 batch + # dataloader_drop_last=False, # 关键:别丢尾,避免空 batch + dataloader_drop_last=True, # drop the incomplete last batch (reverses the earlier keep-the-tail setting) + dispatch_batches=False, dataloader_num_workers=0, dataloader_prefetch_factor=None, dataloader_pin_memory=False,