From fa3fce0e40923d64382234202702bb28e0a0518e Mon Sep 17 00:00:00 2001 From: hailin Date: Tue, 26 Aug 2025 14:38:26 +0800 Subject: [PATCH] . --- train_sft_ds.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/train_sft_ds.py b/train_sft_ds.py index 2f87781..0bcf065 100644 --- a/train_sft_ds.py +++ b/train_sft_ds.py @@ -301,7 +301,7 @@ def parse_args(): ap.add_argument("--save_steps", type=int, default=500) ap.add_argument("--eval_ratio", type=float, default=0.0) ap.add_argument("--seed", type=int, default=1337) - ap.add_argument("--deepspeed", type=str, default="ds_config_zero3.json") + #ap.add_argument("--deepspeed", type=str, default="ds_config_zero3.json") ap.add_argument("--gradient_checkpointing", action="store_true") ap.add_argument("--bf16", action="store_true", help="3090/A100/H100 等可开 bf16;同时在 DS 配置里也要开")