mirror of
https://gitee.com/ascend/ModelLink.git
synced 2024-12-04 21:07:51 +08:00
parent
c0be616e7e
commit
4b28e4f9ea
@ -49,6 +49,10 @@ GPT_ARGS="
|
||||
--use-glm-rope \
|
||||
--rotary-percent 0.5 \
|
||||
--normalization RMSNorm \
|
||||
--use-flash-attn \
|
||||
--use-fused-rmsnorm \
|
||||
--use-fused-swiglu \
|
||||
--num-workers 4 \
|
||||
--swiglu \
|
||||
--use-distributed-optimizer \
|
||||
--tokenizer-type PretrainedFromHF \
|
||||
@ -89,8 +93,8 @@ DATA_ARGS="
|
||||
|
||||
OUTPUT_ARGS="
|
||||
--log-interval 1 \
|
||||
--save-interval 500 \
|
||||
--eval-interval 500 \
|
||||
--save-interval 1000 \
|
||||
--eval-interval 1000 \
|
||||
--eval-iters 10 \
|
||||
"
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user