# Patch for run_ds.sh (blob 252803a -> 24a7965, mode 100755), one hunk at
# old/new line 14 spanning 13 lines on each side.
#
# What changes (two lines removed, two added; everything else is context):
#   * MODEL_NAME_OR_PATH default: /home/test/Qwen3-1.7B -> /home/test/Qwen3-8B
#   * OUTDIR default: $HOME/checkpoints/run-qwen3-1.7b -> $HOME/checkpoints/run-qwen3-8b
#
# Both assignments use the "${VAR:-default}" form, so only the fallback value
# changes; a non-empty value already present in the environment still wins
# (the script's own comment describes the "VAR=xxx ./run_ds.sh" override).
#
# English translation of the non-English comments carried in the context
# lines (they are left untouched below because context lines must match the
# target file exactly for the patch to apply):
#   * "Hyperparameters (local paths; can be overridden with
#     VAR=xxx ./run_ds.sh)"
#   * "Explicitly separate the training/evaluation files (may be changed to
#     a glob pattern as needed)"
#
# NOTE(review): the patch text below sits on a single physical line, with the
# file headers, the hunk header and the +/- lines separated by spaces instead
# of newlines. Presumably an extraction/paste artifact; the line breaks
# (including any blank context lines) must be restored from the original
# patch before `git apply` or `patch` can parse it -- TODO confirm.
# NOTE(review): DS_CONFIG, SEQ_LEN, LR and GAS defaults are unchanged context
# here; whether they still suit the larger model cannot be judged from this
# hunk -- verify separately.
diff --git a/run_ds.sh b/run_ds.sh index 252803a..24a7965 100755 --- a/run_ds.sh +++ b/run_ds.sh @@ -14,13 +14,13 @@ SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)" DS_CONFIG="${DS_CONFIG:-$SCRIPT_DIR/ds_config_zero3.json}" # ==== 超参数(本地路径;可用 VAR=xxx ./run_ds.sh 覆写)==== -MODEL_NAME_OR_PATH="${MODEL_NAME_OR_PATH:-/home/test/Qwen3-1.7B}" +MODEL_NAME_OR_PATH="${MODEL_NAME_OR_PATH:-/home/test/Qwen3-8B}" # 明确区分训练/评测文件(可按需改成通配符) DATA_GLOB="${DATA_GLOB:-$HOME/datasets/my_corpus/train.jsonl}" EVAL_DATA_GLOB="${EVAL_DATA_GLOB:-$HOME/datasets/my_corpus/test.jsonl}" -OUTDIR="${OUTDIR:-$HOME/checkpoints/run-qwen3-1.7b}" +OUTDIR="${OUTDIR:-$HOME/checkpoints/run-qwen3-8b}" SEQ_LEN="${SEQ_LEN:-512}" LR="${LR:-2e-5}" GAS="${GAS:-1}"