"vscode:/vscode.git/clone" did not exist on "20563f6ee5bbd5690e42ff931aa7d256a2285cdc"
Commit b143393c authored by jerrrrry's avatar jerrrrry
Browse files

Upload New File

parent 4567a27f
for para in $*
do
if [[ $para == --profiling* ]];then
profiling=${para#*=}
fi
done
CURRENT_DIR=$( cd "$( dirname "$0" )" && pwd )
MEGATRON_PATH=$( dirname $( dirname ${CURRENT_DIR}))
# Those variables need to modify
DTK_ENV="/opt/dtk/env.sh" # where env.sh of dtk
DATA_PATH="/workspace/OEM_ADVTG_TEST/dcu_megatron/mrgatron-pretrain-datasets/llama3dataset/my-llama_text_document" # path to oscar-1GB_head-llama2_text_document
TOKENIZER_MODEL_PATH="/workspace/OEM_ADVTG_TEST/dcu_megatron/mrgatron-pretrain-datasets/llama3dataset/tokenizer.model" # path to tokenizer.model
CHECKPOINT_PATH="./ckpt/llama3/" # path to ckpt
NCCL_ENV=${MEGATRON_PATH}/requirements/env.sh # Please adjust the variables based on the actual NET being used
LAUNCH_WITH_BINDING=${MEGATRON_PATH}/requirements/launch_with_binding.sh # Please adjust the variables based on the actual NET being used
# Those variables no need to modify
HOSTFILE="hostfile_$(basename "$0" | sed -E 's/^run_(.+)\.sh$/\1/')"
GPUS=$(($(cat ${HOSTFILE}|sort|uniq |wc -l)*8))
HOST="$(cat ${HOSTFILE} |sed -n "1p"|awk -F ' ' '{print $1}')"
PORT="25900"
# Runs Llama3 70B model
source ${NCCL_ENV}
mpirun -np ${GPUS} --hostfile ${HOSTFILE} \
--allow-run-as-root \
--bind-to none \
--mca plm_rsh_no_tree_spawn 1 \
bash -c "
source ${DTK_ENV} && \
source ${NCCL_ENV} && \
./train_llama3_8b_$((${GPUS} / 8))nodes.sh \
${HOST} \
${PORT} \
--data_path=$DATA_PATH \
--tokenizer_path=$TOKENIZER_MODEL_PATH \
--checkpoint_path=$CHECKPOINT_PATH \
--launch_with_binding=${LAUNCH_WITH_BINDING} \
--profiling=$profiling" > log-$((${GPUS} / 8))nodes-`date +%F-%H%M`.log 2>&1
wait
\ No newline at end of file
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment