# train_omnisql_7b.sh
# Last commit: "omnisql" (committed by mashun1)
# Run configuration for the 7B training launch below.
#
# -e: stop at the first command that fails.
# -u: treat a reference to an unset variable as an error, so a misspelled
#     name cannot silently turn into an empty command-line argument.
set -eu

# Values forwarded to train.py as --lr and --epochs; they are also embedded
# in the run name so that runs with different settings get separate
# checkpoint and log directories.
LR=2e-5
EPOCHS=2

# Passed to `accelerate launch` as --config_file.
CONFIG_FILE="./accelerate_config_7b.yaml"

# Forwarded as --per_device_train_batch_size.
PER_DEVICE_TRAIN_BATCH_SIZE=1

# Forwarded as --pretrained_model_name_or_path.
MODEL_PATH="/home/ckpts/Qwen2.5-Coder-7B-Instruct"

# Forwarded as --ckpt_num.
CKPT_NUM=1

# Run name and the output locations derived from it
# (forwarded as --output_ckpt_dir and --tensorboard_log_dir).
BASE_NAME="omnisql_7b_lr${LR}_epochs${EPOCHS}"
CKPT_DIR="./ckpts/${BASE_NAME}"
LOG_DIR="./train_logs/${BASE_NAME}"

# Training data, forwarded as --sft_data_dir. Despite the variable name the
# value is a path to a single JSON file. Alternative datasets are kept here
# commented out; enable exactly one assignment.
# DATASET_DIR="./data/train_bird.json"
# DATASET_DIR="./data/train_spider.json"
DATASET_DIR="./data/train_synsql_part.json"

# Start train.py through `accelerate launch`, using the accelerate config
# file and main process port 10000, and forward the run configuration as
# command-line flags (block size 8192, seed 42, mode "sft").
#
# Every expansion is double-quoted so that a value containing whitespace or
# glob characters (for example a model or dataset path with a space) reaches
# train.py as exactly one argument instead of being split or expanded.
accelerate launch --main_process_port 10000 --config_file "$CONFIG_FILE" train.py \
    --per_device_train_batch_size "$PER_DEVICE_TRAIN_BATCH_SIZE" \
    --block_size 8192 \
    --seed 42 \
    --pretrained_model_name_or_path "$MODEL_PATH" \
    --epochs "$EPOCHS" \
    --lr "$LR" \
    --ckpt_num "$CKPT_NUM" \
    --tensorboard_log_dir "$LOG_DIR" \
    --output_ckpt_dir "$CKPT_DIR" \
    --sft_data_dir "$DATASET_DIR" \
    --mode sft