Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
LLaMA-Factory
Commits
2778a3d0
Commit
2778a3d0
authored
Jan 16, 2025
by
luopl
Browse files
update to v0.9.1_stable
parent
e92143e3
Changes
172
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
20 additions
and
20 deletions
+20
-20
examples/extras/badam/llama3_full_sft.yaml
examples/extras/badam/llama3_full_sft.yaml
+1
-1
examples/extras/fsdp_qlora/llama3_lora_sft.yaml
examples/extras/fsdp_qlora/llama3_lora_sft.yaml
+1
-1
examples/extras/galore/llama3_full_sft.yaml
examples/extras/galore/llama3_full_sft.yaml
+1
-1
examples/extras/llama_pro/llama3_freeze_sft.yaml
examples/extras/llama_pro/llama3_freeze_sft.yaml
+1
-1
examples/extras/loraplus/llama3_lora_sft.yaml
examples/extras/loraplus/llama3_lora_sft.yaml
+1
-1
examples/extras/mod/llama3_full_sft.yaml
examples/extras/mod/llama3_full_sft.yaml
+1
-1
examples/extras/pissa/llama3_lora_sft.yaml
examples/extras/pissa/llama3_lora_sft.yaml
+1
-1
examples/train_full/llama3_full_predict.yaml
examples/train_full/llama3_full_predict.yaml
+1
-1
examples/train_full/llama3_full_sft_ds3.yaml
examples/train_full/llama3_full_sft_ds3.yaml
+1
-1
examples/train_full/qwen2vl_full_sft.yaml
examples/train_full/qwen2vl_full_sft.yaml
+1
-1
examples/train_lora/llama3_lora_dpo.yaml
examples/train_lora/llama3_lora_dpo.yaml
+1
-1
examples/train_lora/llama3_lora_kto.yaml
examples/train_lora/llama3_lora_kto.yaml
+1
-1
examples/train_lora/llama3_lora_ppo.yaml
examples/train_lora/llama3_lora_ppo.yaml
+1
-1
examples/train_lora/llama3_lora_predict.yaml
examples/train_lora/llama3_lora_predict.yaml
+1
-1
examples/train_lora/llama3_lora_pretrain.yaml
examples/train_lora/llama3_lora_pretrain.yaml
+1
-1
examples/train_lora/llama3_lora_reward.yaml
examples/train_lora/llama3_lora_reward.yaml
+1
-1
examples/train_lora/llama3_lora_sft.yaml
examples/train_lora/llama3_lora_sft.yaml
+1
-1
examples/train_lora/llama3_lora_sft_ds0.yaml
examples/train_lora/llama3_lora_sft_ds0.yaml
+1
-1
examples/train_lora/llama3_lora_sft_ds3.yaml
examples/train_lora/llama3_lora_sft_ds3.yaml
+1
-1
examples/train_lora/llama3_preprocess.yaml
examples/train_lora/llama3_preprocess.yaml
+1
-1
No files found.
examples/extras/badam/llama3_full_sft.yaml
View file @
2778a3d0
...
@@ -15,7 +15,7 @@ badam_verbose: 2
...
@@ -15,7 +15,7 @@ badam_verbose: 2
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/extras/fsdp_qlora/llama3_lora_sft.yaml
View file @
2778a3d0
...
@@ -11,7 +11,7 @@ lora_target: all
...
@@ -11,7 +11,7 @@ lora_target: all
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/extras/galore/llama3_full_sft.yaml
View file @
2778a3d0
...
@@ -14,7 +14,7 @@ galore_scale: 2.0
...
@@ -14,7 +14,7 @@ galore_scale: 2.0
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/extras/llama_pro/llama3_freeze_sft.yaml
View file @
2778a3d0
...
@@ -12,7 +12,7 @@ use_llama_pro: true
...
@@ -12,7 +12,7 @@ use_llama_pro: true
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/extras/loraplus/llama3_lora_sft.yaml
View file @
2778a3d0
...
@@ -11,7 +11,7 @@ loraplus_lr_ratio: 16.0
...
@@ -11,7 +11,7 @@ loraplus_lr_ratio: 16.0
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/extras/mod/llama3_full_sft.yaml
View file @
2778a3d0
...
@@ -10,7 +10,7 @@ mixture_of_depths: convert
...
@@ -10,7 +10,7 @@ mixture_of_depths: convert
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/extras/pissa/llama3_lora_sft.yaml
View file @
2778a3d0
...
@@ -13,7 +13,7 @@ pissa_convert: true
...
@@ -13,7 +13,7 @@ pissa_convert: true
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_full/llama3_full_predict.yaml
View file @
2778a3d0
...
@@ -9,7 +9,7 @@ finetuning_type: full
...
@@ -9,7 +9,7 @@ finetuning_type: full
### dataset
### dataset
eval_dataset
:
identity,alpaca_en_demo
eval_dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
50
max_samples
:
50
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_full/llama3_full_sft_ds3.yaml
View file @
2778a3d0
...
@@ -10,7 +10,7 @@ deepspeed: examples/deepspeed/ds_z3_config.json
...
@@ -10,7 +10,7 @@ deepspeed: examples/deepspeed/ds_z3_config.json
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_full/qwen2vl_full_sft.yaml
View file @
2778a3d0
...
@@ -10,7 +10,7 @@ deepspeed: examples/deepspeed/ds_z3_config.json
...
@@ -10,7 +10,7 @@ deepspeed: examples/deepspeed/ds_z3_config.json
### dataset
### dataset
dataset
:
mllm_demo,identity
dataset
:
mllm_demo,identity
template
:
qwen2_vl
template
:
qwen2_vl
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_lora/llama3_lora_dpo.yaml
View file @
2778a3d0
...
@@ -12,7 +12,7 @@ pref_loss: sigmoid # choices: [sigmoid (dpo), orpo, simpo]
...
@@ -12,7 +12,7 @@ pref_loss: sigmoid # choices: [sigmoid (dpo), orpo, simpo]
### dataset
### dataset
dataset
:
dpo_en_demo
dataset
:
dpo_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_lora/llama3_lora_kto.yaml
View file @
2778a3d0
...
@@ -11,7 +11,7 @@ pref_beta: 0.1
...
@@ -11,7 +11,7 @@ pref_beta: 0.1
### dataset
### dataset
dataset
:
kto_en_demo
dataset
:
kto_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_lora/llama3_lora_ppo.yaml
View file @
2778a3d0
...
@@ -11,7 +11,7 @@ lora_target: all
...
@@ -11,7 +11,7 @@ lora_target: all
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_lora/llama3_lora_predict.yaml
View file @
2778a3d0
...
@@ -10,7 +10,7 @@ finetuning_type: lora
...
@@ -10,7 +10,7 @@ finetuning_type: lora
### dataset
### dataset
eval_dataset
:
identity,alpaca_en_demo
eval_dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
50
max_samples
:
50
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_lora/llama3_lora_pretrain.yaml
View file @
2778a3d0
...
@@ -9,7 +9,7 @@ lora_target: all
...
@@ -9,7 +9,7 @@ lora_target: all
### dataset
### dataset
dataset
:
c4_demo
dataset
:
c4_demo
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_lora/llama3_lora_reward.yaml
View file @
2778a3d0
...
@@ -10,7 +10,7 @@ lora_target: all
...
@@ -10,7 +10,7 @@ lora_target: all
### dataset
### dataset
dataset
:
dpo_en_demo
dataset
:
dpo_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_lora/llama3_lora_sft.yaml
View file @
2778a3d0
...
@@ -10,7 +10,7 @@ lora_target: all
...
@@ -10,7 +10,7 @@ lora_target: all
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_lora/llama3_lora_sft_ds0.yaml
View file @
2778a3d0
...
@@ -11,7 +11,7 @@ deepspeed: examples/deepspeed/ds_z0_config.json
...
@@ -11,7 +11,7 @@ deepspeed: examples/deepspeed/ds_z0_config.json
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_lora/llama3_lora_sft_ds3.yaml
View file @
2778a3d0
...
@@ -11,7 +11,7 @@ deepspeed: examples/deepspeed/ds_z3_config.json
...
@@ -11,7 +11,7 @@ deepspeed: examples/deepspeed/ds_z3_config.json
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
examples/train_lora/llama3_preprocess.yaml
View file @
2778a3d0
...
@@ -10,7 +10,7 @@ lora_target: all
...
@@ -10,7 +10,7 @@ lora_target: all
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
template
:
llama3
template
:
llama3
cutoff_len
:
1024
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
overwrite_cache
:
true
overwrite_cache
:
true
preprocessing_num_workers
:
16
preprocessing_num_workers
:
16
...
...
Prev
1
2
3
4
5
6
7
…
9
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment