Commit 744a3911 authored by zhougaofeng
Browse files

Update single_node.sh

parent a35dc7d8
...@@ -3,7 +3,7 @@ ...@@ -3,7 +3,7 @@
export HIP_VISIBLE_DEVICES=6 export HIP_VISIBLE_DEVICES=6
python src/train.py \ python src/train.py \
--stage sft --do_train \ --stage sft --do_train \
--model_name_or_path /home/practice/deepseek-math-7b-base \ --model_name_or_path /home/practice/deepseek-math-7b-base <Your Path>\
--dataset alpaca_en_demo --template deepseek --finetuning_type lora --lora_target q_proj,v_proj \ --dataset alpaca_en_demo --template deepseek --finetuning_type lora --lora_target q_proj,v_proj \
--output_dir saves/deepseek/lora/sft \ --output_dir saves/deepseek/lora/sft \
--overwrite_cache --per_device_train_batch_size 2 --gradient_accumulation_steps 32 --lr_scheduler_type cosine \ --overwrite_cache --per_device_train_batch_size 2 --gradient_accumulation_steps 32 --lr_scheduler_type cosine \
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment