# llama3_preprocess.yaml
# LoRA supervised fine-tuning (SFT) settings for Meta-Llama-3-8B-Instruct.
# NOTE(review): judging by the file name and the `tokenized_path` key, this
# config is presumably used for a dataset pre-tokenization pass — confirm
# against the consuming tool's documentation.

### model
model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code: true

### method
stage: sft
do_train: true
finetuning_type: lora
lora_rank: 8
lora_target: all

### dataset
# Two dataset names joined by a comma, kept as one plain string.
dataset: identity,alpaca_en_demo
template: llama3
cutoff_len: 2048
max_samples: 1000
overwrite_cache: true
preprocessing_num_workers: 16
# NOTE(review): presumably where the tokenized dataset is written/read — verify.
tokenized_path: saves/llama3-8b/dataset/sft

### output
output_dir: saves/llama3-8b/lora/sft
overwrite_output_dir: true