Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
LLaMA-Factory
Commits
8293100a
Commit
8293100a
authored
Jan 16, 2025
by
luopl
Browse files
update to 0.9.2.dev0
parent
2778a3d0
Changes
124
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
114 additions
and
3 deletions
+114
-3
examples/inference/llama3_vllm.yaml
examples/inference/llama3_vllm.yaml
+1
-0
examples/inference/llava1_5.yaml
examples/inference/llava1_5.yaml
+2
-0
examples/inference/qwen2_vl.yaml
examples/inference/qwen2_vl.yaml
+2
-0
examples/merge_lora/llama3_gptq.yaml
examples/merge_lora/llama3_gptq.yaml
+1
-0
examples/merge_lora/llama3_lora_sft.yaml
examples/merge_lora/llama3_lora_sft.yaml
+1
-0
examples/merge_lora/qwen2vl_lora_sft.yaml
examples/merge_lora/qwen2vl_lora_sft.yaml
+1
-0
examples/train_full/llama3_full_sft.yaml
examples/train_full/llama3_full_sft.yaml
+40
-0
examples/train_full/qwen2vl_full_sft.yaml
examples/train_full/qwen2vl_full_sft.yaml
+6
-2
examples/train_lora/llama3_lora_dpo.yaml
examples/train_lora/llama3_lora_dpo.yaml
+1
-0
examples/train_lora/llama3_lora_eval.yaml
examples/train_lora/llama3_lora_eval.yaml
+1
-0
examples/train_lora/llama3_lora_kto.yaml
examples/train_lora/llama3_lora_kto.yaml
+1
-0
examples/train_lora/llama3_lora_ppo.yaml
examples/train_lora/llama3_lora_ppo.yaml
+1
-0
examples/train_lora/llama3_lora_pretrain.yaml
examples/train_lora/llama3_lora_pretrain.yaml
+1
-0
examples/train_lora/llama3_lora_reward.yaml
examples/train_lora/llama3_lora_reward.yaml
+1
-0
examples/train_lora/llama3_lora_sft.yaml
examples/train_lora/llama3_lora_sft.yaml
+1
-0
examples/train_lora/llama3_lora_sft_ds3.yaml
examples/train_lora/llama3_lora_sft_ds3.yaml
+2
-1
examples/train_lora/llama3_lora_sft_ray.yaml
examples/train_lora/llama3_lora_sft_ray.yaml
+48
-0
examples/train_lora/llama3_preprocess.yaml
examples/train_lora/llama3_preprocess.yaml
+1
-0
examples/train_lora/llava1_5_lora_sft.yaml
examples/train_lora/llava1_5_lora_sft.yaml
+1
-0
examples/train_lora/qwen2vl_lora_dpo.yaml
examples/train_lora/qwen2vl_lora_dpo.yaml
+1
-0
No files found.
examples/inference/llama3_vllm.yaml
View file @
8293100a
...
@@ -2,3 +2,4 @@ model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
...
@@ -2,3 +2,4 @@ model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
template
:
llama3
template
:
llama3
infer_backend
:
vllm
infer_backend
:
vllm
vllm_enforce_eager
:
true
vllm_enforce_eager
:
true
trust_remote_code
:
true
examples/inference/llava1_5.yaml
View file @
8293100a
model_name_or_path
:
llava-hf/llava-1.5-7b-hf
model_name_or_path
:
llava-hf/llava-1.5-7b-hf
template
:
llava
template
:
llava
infer_backend
:
huggingface
# choices: [huggingface, vllm]
trust_remote_code
:
true
examples/inference/qwen2_vl.yaml
View file @
8293100a
model_name_or_path
:
Qwen/Qwen2-VL-7B-Instruct
model_name_or_path
:
Qwen/Qwen2-VL-7B-Instruct
template
:
qwen2_vl
template
:
qwen2_vl
infer_backend
:
huggingface
# choices: [huggingface, vllm]
trust_remote_code
:
true
examples/merge_lora/llama3_gptq.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
template
:
llama3
template
:
llama3
trust_remote_code
:
true
### export
### export
export_dir
:
models/llama3_gptq
export_dir
:
models/llama3_gptq
...
...
examples/merge_lora/llama3_lora_sft.yaml
View file @
8293100a
...
@@ -5,6 +5,7 @@ model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
...
@@ -5,6 +5,7 @@ model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
adapter_name_or_path
:
saves/llama3-8b/lora/sft
adapter_name_or_path
:
saves/llama3-8b/lora/sft
template
:
llama3
template
:
llama3
finetuning_type
:
lora
finetuning_type
:
lora
trust_remote_code
:
true
### export
### export
export_dir
:
models/llama3_lora_sft
export_dir
:
models/llama3_lora_sft
...
...
examples/merge_lora/qwen2vl_lora_sft.yaml
View file @
8293100a
...
@@ -5,6 +5,7 @@ model_name_or_path: Qwen/Qwen2-VL-7B-Instruct
...
@@ -5,6 +5,7 @@ model_name_or_path: Qwen/Qwen2-VL-7B-Instruct
adapter_name_or_path
:
saves/qwen2_vl-7b/lora/sft
adapter_name_or_path
:
saves/qwen2_vl-7b/lora/sft
template
:
qwen2_vl
template
:
qwen2_vl
finetuning_type
:
lora
finetuning_type
:
lora
trust_remote_code
:
true
### export
### export
export_dir
:
models/qwen2_vl_lora_sft
export_dir
:
models/qwen2_vl_lora_sft
...
...
examples/train_full/llama3_full_sft.yaml
0 → 100644
View file @
8293100a
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
stage
:
sft
do_train
:
true
finetuning_type
:
full
deepspeed
:
examples/deepspeed/ds_z3_config.json
# choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
### dataset
dataset
:
identity,alpaca_en_demo
template
:
llama3
cutoff_len
:
2048
max_samples
:
1000
overwrite_cache
:
true
preprocessing_num_workers
:
16
### output
output_dir
:
saves/llama3-8b/full/sft
logging_steps
:
10
save_steps
:
500
plot_loss
:
true
overwrite_output_dir
:
true
### train
per_device_train_batch_size
:
1
gradient_accumulation_steps
:
2
learning_rate
:
1.0e-5
num_train_epochs
:
3.0
lr_scheduler_type
:
cosine
warmup_ratio
:
0.1
bf16
:
true
ddp_timeout
:
180000000
### eval
val_size
:
0.1
per_device_eval_batch_size
:
1
eval_strategy
:
steps
eval_steps
:
500
examples/train_full/qwen2vl_full_sft.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
Qwen/Qwen2-VL-7B-Instruct
model_name_or_path
:
Qwen/Qwen2-VL-7B-Instruct
trust_remote_code
:
true
### method
### method
stage
:
sft
stage
:
sft
do_train
:
true
do_train
:
true
finetuning_type
:
full
finetuning_type
:
full
deepspeed
:
examples/deepspeed/ds_z3_config.json
freeze_vision_tower
:
true
# choices: [true, false]
freeze_multi_modal_projector
:
true
# choices: [true, false]
train_mm_proj_only
:
false
# choices: [true, false]
deepspeed
:
examples/deepspeed/ds_z3_config.json
# choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
### dataset
### dataset
dataset
:
mllm_demo,identity
dataset
:
mllm_demo,identity
,alpaca_en_demo
template
:
qwen2_vl
template
:
qwen2_vl
cutoff_len
:
2048
cutoff_len
:
2048
max_samples
:
1000
max_samples
:
1000
...
...
examples/train_lora/llama3_lora_dpo.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
### method
stage
:
dpo
stage
:
dpo
...
...
examples/train_lora/llama3_lora_eval.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
adapter_name_or_path
:
saves/llama3-8b/lora/sft
adapter_name_or_path
:
saves/llama3-8b/lora/sft
trust_remote_code
:
true
### method
### method
finetuning_type
:
lora
finetuning_type
:
lora
...
...
examples/train_lora/llama3_lora_kto.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
### method
stage
:
kto
stage
:
kto
...
...
examples/train_lora/llama3_lora_ppo.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
reward_model
:
saves/llama3-8b/lora/reward
reward_model
:
saves/llama3-8b/lora/reward
trust_remote_code
:
true
### method
### method
stage
:
ppo
stage
:
ppo
...
...
examples/train_lora/llama3_lora_pretrain.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
### method
stage
:
pt
stage
:
pt
...
...
examples/train_lora/llama3_lora_reward.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
### method
stage
:
rm
stage
:
rm
...
...
examples/train_lora/llama3_lora_sft.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
### method
stage
:
sft
stage
:
sft
...
...
examples/train_lora/llama3_lora_sft_ds3.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
### method
stage
:
sft
stage
:
sft
do_train
:
true
do_train
:
true
finetuning_type
:
lora
finetuning_type
:
lora
lora_target
:
all
lora_target
:
all
deepspeed
:
examples/deepspeed/ds_z3_config.json
deepspeed
:
examples/deepspeed/ds_z3_config.json
# choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
### dataset
### dataset
dataset
:
identity,alpaca_en_demo
dataset
:
identity,alpaca_en_demo
...
...
examples/train_lora/llama3_lora_sft_ray.yaml
0 → 100644
View file @
8293100a
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
# or use local absolute path
trust_remote_code
:
true
### method
stage
:
sft
do_train
:
true
finetuning_type
:
lora
lora_target
:
all
### dataset
dataset
:
identity,alpaca_en_demo
dataset_dir
:
REMOTE:llamafactory/demo_data
# or use local absolute path
template
:
llama3
cutoff_len
:
2048
max_samples
:
1000
overwrite_cache
:
true
preprocessing_num_workers
:
16
### output
output_dir
:
tmp_dir
logging_steps
:
10
save_steps
:
500
plot_loss
:
true
overwrite_output_dir
:
true
### train
per_device_train_batch_size
:
1
gradient_accumulation_steps
:
8
learning_rate
:
1.0e-4
num_train_epochs
:
3.0
lr_scheduler_type
:
cosine
warmup_ratio
:
0.1
bf16
:
true
ddp_timeout
:
180000000
### eval
val_size
:
0.1
per_device_eval_batch_size
:
1
eval_strategy
:
steps
eval_steps
:
500
### ray
ray_run_name
:
llama3_8b_sft_lora
ray_num_workers
:
4
# number of GPUs to use
resources_per_worker
:
GPU
:
1
placement_strategy
:
PACK
examples/train_lora/llama3_preprocess.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
### method
stage
:
sft
stage
:
sft
...
...
examples/train_lora/llava1_5_lora_sft.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
llava-hf/llava-1.5-7b-hf
model_name_or_path
:
llava-hf/llava-1.5-7b-hf
trust_remote_code
:
true
### method
### method
stage
:
sft
stage
:
sft
...
...
examples/train_lora/qwen2vl_lora_dpo.yaml
View file @
8293100a
### model
### model
model_name_or_path
:
Qwen/Qwen2-VL-7B-Instruct
model_name_or_path
:
Qwen/Qwen2-VL-7B-Instruct
trust_remote_code
:
true
### method
### method
stage
:
dpo
stage
:
dpo
...
...
Prev
1
2
3
4
5
6
7
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment