From 156805e04db30569c8f9c520db458d9136f91d79 Mon Sep 17 00:00:00 2001 From: hailin Date: Thu, 28 Aug 2025 19:02:07 +0800 Subject: [PATCH] . --- mm-zero3.sh | 4 ++-- ss-zero3.sh | 4 ++-- ss.sh | 4 ++-- 3 files changed, 6 insertions(+), 6 deletions(-) diff --git a/mm-zero3.sh b/mm-zero3.sh index 5c8a7fc..487c963 100755 --- a/mm-zero3.sh +++ b/mm-zero3.sh @@ -1,9 +1,9 @@ deepspeed --hostfile hostfile \ --num_nodes 6 --num_gpus 4 \ /home/test/jd_train/train_sft_ds.py \ - --model_name_or_path /home/test/Qwen3-1.7B \ + --model_name_or_path /home/test/Qwen3-8B \ --data_glob "/home/test/datasets/my_corpus/train.jsonl" \ - --output_dir /home/test/checkpoints/q3-1_7b-ds4 \ + --output_dir /home/test/checkpoints/q3-8b-ds4 \ --seq_len 512 \ --per_device_train_batch_size 1 \ --gradient_accumulation_steps 1 \ diff --git a/ss-zero3.sh b/ss-zero3.sh index 8e93f2b..4bb4782 100755 --- a/ss-zero3.sh +++ b/ss-zero3.sh @@ -3,9 +3,9 @@ export PYTORCH_CUDA_ALLOC_CONF="max_split_size_mb:128" export NCCL_DEBUG=INFO torchrun --nproc_per_node 4 /home/test/jd_train/train_sft_ds.py \ - --model_name_or_path /home/test/Qwen3-1.7B \ + --model_name_or_path /home/test/Qwen3-8B \ --data_glob "/home/test/datasets/my_corpus/train.jsonl" \ - --output_dir /home/test/checkpoints/q3-1_7b-ds4 \ + --output_dir /home/test/checkpoints/q3-8b-ds4 \ --seq_len 512 \ --per_device_train_batch_size 1 \ --gradient_accumulation_steps 1 \ diff --git a/ss.sh b/ss.sh index d82ac4b..b3f4f6c 100755 --- a/ss.sh +++ b/ss.sh @@ -4,9 +4,9 @@ export NCCL_DEBUG=INFO export CUDA_VISIBLE_DEVICES=0 torchrun --nproc_per_node 1 /home/test/jd_train/train_sft_ds.py \ - --model_name_or_path /home/test/Qwen3-1.7B \ + --model_name_or_path /home/test/Qwen3-8B \ --data_glob "/home/test/datasets/my_corpus/train.jsonl" \ - --output_dir /home/test/checkpoints/smoke-q3-1_7b-ds \ + --output_dir /home/test/checkpoints/smoke-q3-8b-ds \ --seq_len 512 \ --per_device_train_batch_size 1 \ --gradient_accumulation_steps 1 \