"git@developer.sourcefind.cn:change/sglang.git" did not exist on "2afba1b1c1424f1a7706d6458359b15b555bae1c"
Commit 77361dae authored by liangjing's avatar liangjing
Browse files

update

parent c9289b90
...@@ -32,8 +32,9 @@ GPT_MODEL_ARGS=( ...@@ -32,8 +32,9 @@ GPT_MODEL_ARGS=(
) )
TRAINING_ARGS=( TRAINING_ARGS=(
--transformer-impl local --log-throughput
--use-legacy-models --transformer-impl transformer_engine
--use-mcore-models
--micro-batch-size 1 --micro-batch-size 1
--global-batch-size 256 --global-batch-size 256
--train-iters 100 --train-iters 100
......
...@@ -36,8 +36,9 @@ GPT_MODEL_ARGS=( ...@@ -36,8 +36,9 @@ GPT_MODEL_ARGS=(
) )
TRAINING_ARGS=( TRAINING_ARGS=(
--transformer-impl local --log-throughput
--use-legacy-models --transformer-impl transformer_engine
--use-mcore-models
--micro-batch-size 1 --micro-batch-size 1
--global-batch-size 512 --global-batch-size 512
--train-iters 100 --train-iters 100
......
...@@ -32,8 +32,8 @@ GPT_MODEL_ARGS=( ...@@ -32,8 +32,8 @@ GPT_MODEL_ARGS=(
TRAINING_ARGS=( TRAINING_ARGS=(
--log-throughput --log-throughput
--transformer-impl local --transformer-impl transformer_engine
--use-legacy-models --use-mcore-models
--micro-batch-size 1 --micro-batch-size 1
--global-batch-size 240 --global-batch-size 240
--train-iters 100 --train-iters 100
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment