We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent ab953b1 · commit 486ed26 · Copy full SHA for 486ed26
pretrain/scripts/v3-1.7b-exp2-cpt-2epoch-sakura/train.sh
@@ -54,7 +54,7 @@ GRAD_CLIP=1
54
# 988240 + 988240 = 1976480
55
LR_WARMUP_STEPS=2000
56
LR_DECAY_ITERS=988240
57
-TRAIN_STEPS=$(((${LR_WARMUP_STEPS} + ${LR_DECAY_ITERS}) * 2)
+TRAIN_STEPS=$(((${LR_WARMUP_STEPS} + ${LR_DECAY_ITERS}) * 2))
58
59
# model config
60
TOKENIZER_MODEL=${ENV_DIR}/src/llm-jp-tokenizer/models/ver3.0/llm-jp-tokenizer-100k.ver3.0b1.model
0 commit comments