From d2bdb8af9e0a11449d0b8a9cc4745f264c4341ad Mon Sep 17 00:00:00 2001 From: hailin Date: Tue, 23 Sep 2025 16:49:41 +0800 Subject: [PATCH] . --- lora_merge_zero3_safetensors.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/lora_merge_zero3_safetensors.sh b/lora_merge_zero3_safetensors.sh index 3c0bd4d..f93ba77 100755 --- a/lora_merge_zero3_safetensors.sh +++ b/lora_merge_zero3_safetensors.sh @@ -3,7 +3,7 @@ set -euo pipefail # ===== 可调参数 ===== CKPT_ROOT="/home/test/checkpoints/q3-32b-lora" # 若实际是 .../checkpoint-62/global_step62,请把 CKPT_ROOT 改成 .../checkpoint-62 -TAG="global_step30" +TAG="global_step200" HOSTS=(tn01 tn02 tn03 tn04 tn05 tn06) AGGREGATOR_HOST="tn06" # 本脚本运行/汇总所在机器 EXPECTED_SHARDS_PER_HOST=4 # 每机应写出分片数(按你的并行布局)