Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
TS-MODELS-OPT
training
Autonomous-Driving-models
Commits
5ed76316
Commit
5ed76316
authored
Apr 08, 2026
by
雍大凯
Browse files
models add
parent
b2379236
Changes
290
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
494 additions
and
0 deletions
+494
-0
docker-hub/qwen2.5-vl/llama-factory/examples/extras/llama_pro/expand.sh
...n2.5-vl/llama-factory/examples/extras/llama_pro/expand.sh
+6
-0
docker-hub/qwen2.5-vl/llama-factory/examples/extras/llama_pro/llama3_freeze_sft.yaml
...-factory/examples/extras/llama_pro/llama3_freeze_sft.yaml
+45
-0
docker-hub/qwen2.5-vl/llama-factory/examples/extras/loraplus/llama3_lora_sft.yaml
...ama-factory/examples/extras/loraplus/llama3_lora_sft.yaml
+45
-0
docker-hub/qwen2.5-vl/llama-factory/examples/extras/mod/llama3_full_sft.yaml
...vl/llama-factory/examples/extras/mod/llama3_full_sft.yaml
+44
-0
docker-hub/qwen2.5-vl/llama-factory/examples/extras/muon/qwen2_full_sft.yaml
...vl/llama-factory/examples/extras/muon/qwen2_full_sft.yaml
+43
-0
docker-hub/qwen2.5-vl/llama-factory/examples/extras/nlg_eval/llama3_lora_predict.yaml
...factory/examples/extras/nlg_eval/llama3_lora_predict.yaml
+31
-0
docker-hub/qwen2.5-vl/llama-factory/examples/extras/pissa/init.sh
...ub/qwen2.5-vl/llama-factory/examples/extras/pissa/init.sh
+5
-0
docker-hub/qwen2.5-vl/llama-factory/examples/extras/pissa/llama3_lora_sft.yaml
.../llama-factory/examples/extras/pissa/llama3_lora_sft.yaml
+47
-0
docker-hub/qwen2.5-vl/llama-factory/examples/inference/llama3.yaml
...b/qwen2.5-vl/llama-factory/examples/inference/llama3.yaml
+4
-0
docker-hub/qwen2.5-vl/llama-factory/examples/inference/llama3_full_sft.yaml
...-vl/llama-factory/examples/inference/llama3_full_sft.yaml
+4
-0
docker-hub/qwen2.5-vl/llama-factory/examples/inference/llama3_lora_sft.yaml
...-vl/llama-factory/examples/inference/llama3_lora_sft.yaml
+5
-0
docker-hub/qwen2.5-vl/llama-factory/examples/inference/qwen2_5vl.yaml
...wen2.5-vl/llama-factory/examples/inference/qwen2_5vl.yaml
+4
-0
docker-hub/qwen2.5-vl/llama-factory/examples/merge_lora/llama3_full_sft.yaml
...vl/llama-factory/examples/merge_lora/llama3_full_sft.yaml
+10
-0
docker-hub/qwen2.5-vl/llama-factory/examples/merge_lora/llama3_gptq.yaml
...2.5-vl/llama-factory/examples/merge_lora/llama3_gptq.yaml
+12
-0
docker-hub/qwen2.5-vl/llama-factory/examples/merge_lora/llama3_lora_sft.yaml
...vl/llama-factory/examples/merge_lora/llama3_lora_sft.yaml
+13
-0
docker-hub/qwen2.5-vl/llama-factory/examples/merge_lora/qwen2_5vl_lora_sft.yaml
...llama-factory/examples/merge_lora/qwen2_5vl_lora_sft.yaml
+13
-0
docker-hub/qwen2.5-vl/llama-factory/examples/train_full/llama3_full_sft.yaml
...vl/llama-factory/examples/train_full/llama3_full_sft.yaml
+45
-0
docker-hub/qwen2.5-vl/llama-factory/examples/train_full/qwen2_5vl_full_sft.yaml
...llama-factory/examples/train_full/qwen2_5vl_full_sft.yaml
+51
-0
docker-hub/qwen2.5-vl/llama-factory/examples/train_lora/llama3_lora_dpo.yaml
...vl/llama-factory/examples/train_lora/llama3_lora_dpo.yaml
+48
-0
docker-hub/qwen2.5-vl/llama-factory/examples/train_lora/llama3_lora_eval.yaml
...l/llama-factory/examples/train_lora/llama3_lora_eval.yaml
+19
-0
No files found.
docker-hub/qwen2.5-vl/llama-factory/examples/extras/llama_pro/expand.sh
0 → 100644
View file @
5ed76316
#!/bin/bash
python scripts/llama_pro.py
\
--model_name_or_path
meta-llama/Meta-Llama-3-8B-Instruct
\
--output_dir
models/llama3-8b-pro
\
--num_expand
8
docker-hub/qwen2.5-vl/llama-factory/examples/extras/llama_pro/llama3_freeze_sft.yaml
0 → 100644
View file @
5ed76316
### model
model_name_or_path
:
models/llama3-8b-pro
trust_remote_code
:
true
### method
stage
:
sft
do_train
:
true
finetuning_type
:
freeze
freeze_trainable_layers
:
8
freeze_trainable_modules
:
all
use_llama_pro
:
true
### dataset
dataset
:
identity,alpaca_en_demo
template
:
llama3
cutoff_len
:
2048
max_samples
:
1000
overwrite_cache
:
true
preprocessing_num_workers
:
16
dataloader_num_workers
:
4
### output
output_dir
:
saves/llama3-8b-pro/freeze/sft
logging_steps
:
10
save_steps
:
500
plot_loss
:
true
overwrite_output_dir
:
true
save_only_model
:
false
report_to
:
none
# choices: [none, wandb, tensorboard, swanlab, mlflow]
### train
per_device_train_batch_size
:
1
gradient_accumulation_steps
:
8
learning_rate
:
1.0e-4
num_train_epochs
:
3.0
lr_scheduler_type
:
cosine
warmup_ratio
:
0.1
bf16
:
true
ddp_timeout
:
180000000
### eval
# val_size: 0.1
# per_device_eval_batch_size: 1
# eval_strategy: steps
# eval_steps: 500
docker-hub/qwen2.5-vl/llama-factory/examples/extras/loraplus/llama3_lora_sft.yaml
0 → 100644
View file @
5ed76316
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
stage
:
sft
do_train
:
true
finetuning_type
:
lora
lora_rank
:
8
lora_target
:
all
loraplus_lr_ratio
:
16.0
### dataset
dataset
:
identity,alpaca_en_demo
template
:
llama3
cutoff_len
:
2048
max_samples
:
1000
overwrite_cache
:
true
preprocessing_num_workers
:
16
dataloader_num_workers
:
4
### output
output_dir
:
saves/llama3-8b/lora/sft
logging_steps
:
10
save_steps
:
500
plot_loss
:
true
overwrite_output_dir
:
true
save_only_model
:
false
report_to
:
none
# choices: [none, wandb, tensorboard, swanlab, mlflow]
### train
per_device_train_batch_size
:
1
gradient_accumulation_steps
:
8
learning_rate
:
1.0e-4
num_train_epochs
:
3.0
lr_scheduler_type
:
cosine
warmup_ratio
:
0.1
bf16
:
true
ddp_timeout
:
180000000
### eval
# val_size: 0.1
# per_device_eval_batch_size: 1
# eval_strategy: steps
# eval_steps: 500
docker-hub/qwen2.5-vl/llama-factory/examples/extras/mod/llama3_full_sft.yaml
0 → 100644
View file @
5ed76316
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
stage
:
sft
do_train
:
true
finetuning_type
:
full
mixture_of_depths
:
convert
### dataset
dataset
:
identity,alpaca_en_demo
template
:
llama3
cutoff_len
:
2048
max_samples
:
1000
overwrite_cache
:
true
preprocessing_num_workers
:
16
dataloader_num_workers
:
4
### output
output_dir
:
saves/llama3-8b-mod/full/sft
logging_steps
:
10
save_steps
:
500
plot_loss
:
true
overwrite_output_dir
:
true
save_only_model
:
false
report_to
:
none
# choices: [none, wandb, tensorboard, swanlab, mlflow]
### train
per_device_train_batch_size
:
1
gradient_accumulation_steps
:
8
optim
:
paged_adamw_8bit
learning_rate
:
1.0e-5
num_train_epochs
:
3.0
lr_scheduler_type
:
cosine
warmup_ratio
:
0.1
pure_bf16
:
true
ddp_timeout
:
180000000
### eval
# val_size: 0.1
# per_device_eval_batch_size: 1
# eval_strategy: steps
# eval_steps: 500
docker-hub/qwen2.5-vl/llama-factory/examples/extras/muon/qwen2_full_sft.yaml
0 → 100644
View file @
5ed76316
### model
model_name_or_path
:
Qwen/Qwen2-1.5B-Instruct
trust_remote_code
:
true
### method
stage
:
sft
do_train
:
true
finetuning_type
:
full
use_muon
:
true
### dataset
dataset
:
identity,alpaca_en_demo
template
:
qwen
cutoff_len
:
2048
max_samples
:
1000
overwrite_cache
:
true
preprocessing_num_workers
:
16
dataloader_num_workers
:
4
### output
output_dir
:
saves/qwen2-1_5b/full/sft
logging_steps
:
10
save_steps
:
500
plot_loss
:
true
overwrite_output_dir
:
true
save_only_model
:
false
report_to
:
none
# choices: [none, wandb, tensorboard, swanlab, mlflow]
### train
per_device_train_batch_size
:
1
gradient_accumulation_steps
:
8
learning_rate
:
1.0e-5
num_train_epochs
:
3.0
lr_scheduler_type
:
cosine
warmup_ratio
:
0.1
bf16
:
true
ddp_timeout
:
180000000
### eval
# val_size: 0.1
# per_device_eval_batch_size: 1
# eval_strategy: steps
# eval_steps: 500
docker-hub/qwen2.5-vl/llama-factory/examples/extras/nlg_eval/llama3_lora_predict.yaml
0 → 100644
View file @
5ed76316
# The batch generation can be SLOW using this config.
# For faster inference, we recommend to use `scripts/vllm_infer.py`.
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
adapter_name_or_path
:
saves/llama3-8b/lora/sft
trust_remote_code
:
true
### method
stage
:
sft
do_predict
:
true
finetuning_type
:
lora
### dataset
eval_dataset
:
identity,alpaca_en_demo
template
:
llama3
cutoff_len
:
2048
max_samples
:
50
overwrite_cache
:
true
preprocessing_num_workers
:
16
dataloader_num_workers
:
4
### output
output_dir
:
saves/llama3-8b/lora/predict
overwrite_output_dir
:
true
report_to
:
none
# choices: [none, wandb, tensorboard, swanlab, mlflow]
### eval
per_device_eval_batch_size
:
1
predict_with_generate
:
true
ddp_timeout
:
180000000
docker-hub/qwen2.5-vl/llama-factory/examples/extras/pissa/init.sh
0 → 100644
View file @
5ed76316
#!/bin/bash
python scripts/pissa_init.py
\
--model_name_or_path
meta-llama/Meta-Llama-3-8B-Instruct
\
--output_dir
models/llama3-8b-pissa
docker-hub/qwen2.5-vl/llama-factory/examples/extras/pissa/llama3_lora_sft.yaml
0 → 100644
View file @
5ed76316
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
stage
:
sft
do_train
:
true
finetuning_type
:
lora
lora_rank
:
8
lora_target
:
all
pissa_init
:
true
pissa_iter
:
16
pissa_convert
:
true
### dataset
dataset
:
identity,alpaca_en_demo
template
:
llama3
cutoff_len
:
2048
max_samples
:
1000
overwrite_cache
:
true
preprocessing_num_workers
:
16
dataloader_num_workers
:
4
### output
output_dir
:
saves/llama3-8b/lora/sft
logging_steps
:
10
save_steps
:
500
plot_loss
:
true
overwrite_output_dir
:
true
save_only_model
:
false
report_to
:
none
# choices: [none, wandb, tensorboard, swanlab, mlflow]
### train
per_device_train_batch_size
:
1
gradient_accumulation_steps
:
8
learning_rate
:
1.0e-4
num_train_epochs
:
3.0
lr_scheduler_type
:
cosine
warmup_ratio
:
0.1
bf16
:
true
ddp_timeout
:
180000000
### eval
# val_size: 0.1
# per_device_eval_batch_size: 1
# eval_strategy: steps
# eval_steps: 500
docker-hub/qwen2.5-vl/llama-factory/examples/inference/llama3.yaml
0 → 100644
View file @
5ed76316
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
template
:
llama3
infer_backend
:
huggingface
# choices: [huggingface, vllm, sglang]
trust_remote_code
:
true
docker-hub/qwen2.5-vl/llama-factory/examples/inference/llama3_full_sft.yaml
0 → 100644
View file @
5ed76316
model_name_or_path
:
saves/llama3-8b/full/sft
template
:
llama3
infer_backend
:
huggingface
# choices: [huggingface, vllm, sglang]
trust_remote_code
:
true
docker-hub/qwen2.5-vl/llama-factory/examples/inference/llama3_lora_sft.yaml
0 → 100644
View file @
5ed76316
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
adapter_name_or_path
:
saves/llama3-8b/lora/sft
template
:
llama3
infer_backend
:
huggingface
# choices: [huggingface, vllm, sglang]
trust_remote_code
:
true
docker-hub/qwen2.5-vl/llama-factory/examples/inference/qwen2_5vl.yaml
0 → 100644
View file @
5ed76316
model_name_or_path
:
Qwen/Qwen2.5-VL-7B-Instruct
template
:
qwen2_vl
infer_backend
:
huggingface
# choices: [huggingface, vllm, sglang]
trust_remote_code
:
true
docker-hub/qwen2.5-vl/llama-factory/examples/merge_lora/llama3_full_sft.yaml
0 → 100644
View file @
5ed76316
### model
model_name_or_path
:
saves/llama3-8b/full/sft
template
:
llama3
trust_remote_code
:
true
### export
export_dir
:
output/llama3_full_sft
export_size
:
5
export_device
:
cpu
# choices: [cpu, auto]
export_legacy_format
:
false
docker-hub/qwen2.5-vl/llama-factory/examples/merge_lora/llama3_gptq.yaml
0 → 100644
View file @
5ed76316
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
template
:
llama3
trust_remote_code
:
true
### export
export_dir
:
output/llama3_gptq
export_quantization_bit
:
4
export_quantization_dataset
:
data/c4_demo.jsonl
export_size
:
5
export_device
:
cpu
# choices: [cpu, auto]
export_legacy_format
:
false
docker-hub/qwen2.5-vl/llama-factory/examples/merge_lora/llama3_lora_sft.yaml
0 → 100644
View file @
5ed76316
### Note: DO NOT use quantized model or quantization_bit when merging lora adapters
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
adapter_name_or_path
:
saves/llama3-8b/lora/sft
template
:
llama3
trust_remote_code
:
true
### export
export_dir
:
output/llama3_lora_sft
export_size
:
5
export_device
:
cpu
# choices: [cpu, auto]
export_legacy_format
:
false
docker-hub/qwen2.5-vl/llama-factory/examples/merge_lora/qwen2_5vl_lora_sft.yaml
0 → 100644
View file @
5ed76316
### Note: DO NOT use quantized model or quantization_bit when merging lora adapters
### model
model_name_or_path
:
Qwen/Qwen2.5-VL-7B-Instruct
adapter_name_or_path
:
saves/qwen2_5vl-7b/lora/sft
template
:
qwen2_vl
trust_remote_code
:
true
### export
export_dir
:
output/qwen2_5vl_lora_sft
export_size
:
5
export_device
:
cpu
# choices: [cpu, auto]
export_legacy_format
:
false
docker-hub/qwen2.5-vl/llama-factory/examples/train_full/llama3_full_sft.yaml
0 → 100644
View file @
5ed76316
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
stage
:
sft
do_train
:
true
finetuning_type
:
full
deepspeed
:
examples/deepspeed/ds_z3_config.json
# choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
### dataset
dataset
:
identity,alpaca_en_demo
template
:
llama3
cutoff_len
:
2048
max_samples
:
1000
overwrite_cache
:
true
preprocessing_num_workers
:
16
dataloader_num_workers
:
4
### output
output_dir
:
saves/llama3-8b/full/sft
logging_steps
:
10
save_steps
:
500
plot_loss
:
true
overwrite_output_dir
:
true
save_only_model
:
false
report_to
:
none
# choices: [none, wandb, tensorboard, swanlab, mlflow]
### train
per_device_train_batch_size
:
1
gradient_accumulation_steps
:
2
learning_rate
:
1.0e-5
num_train_epochs
:
3.0
lr_scheduler_type
:
cosine
warmup_ratio
:
0.1
bf16
:
true
ddp_timeout
:
180000000
resume_from_checkpoint
:
null
### eval
# eval_dataset: alpaca_en_demo
# val_size: 0.1
# per_device_eval_batch_size: 1
# eval_strategy: steps
# eval_steps: 500
docker-hub/qwen2.5-vl/llama-factory/examples/train_full/qwen2_5vl_full_sft.yaml
0 → 100644
View file @
5ed76316
### model
model_name_or_path
:
/models/qwen2.5/Qwen2.5-VL-7B-Instruct/
image_max_pixels
:
262144
video_max_pixels
:
16384
trust_remote_code
:
true
### method
stage
:
sft
do_train
:
true
finetuning_type
:
full
freeze_vision_tower
:
true
freeze_multi_modal_projector
:
true
freeze_language_model
:
false
deepspeed
:
examples/deepspeed/ds_z3_config.json
### dataset
dataset
:
mllm_demo,identity,alpaca_en_demo
template
:
qwen2_vl
cutoff_len
:
2048
max_samples
:
1000
overwrite_cache
:
true
preprocessing_num_workers
:
16
dataloader_num_workers
:
4
### output
output_dir
:
saves/qwen2_5vl-7b/full/sft
logging_steps
:
10
save_steps
:
0
save_strategy
:
"
no"
save_total_limit
:
0
plot_loss
:
true
overwrite_output_dir
:
true
save_only_model
:
false
report_to
:
none
# choices: [none, wandb, tensorboard, swanlab, mlflow]
### train
per_device_train_batch_size
:
16
gradient_accumulation_steps
:
2
learning_rate
:
1.0e-5
num_train_epochs
:
3.0
lr_scheduler_type
:
cosine
warmup_ratio
:
0.1
bf16
:
true
ddp_timeout
:
180000000
resume_from_checkpoint
:
null
### eval
# val_size: 0.1
# per_device_eval_batch_size: 1
# eval_strategy: steps
# eval_steps: 500
docker-hub/qwen2.5-vl/llama-factory/examples/train_lora/llama3_lora_dpo.yaml
0 → 100644
View file @
5ed76316
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
trust_remote_code
:
true
### method
stage
:
dpo
do_train
:
true
finetuning_type
:
lora
lora_rank
:
8
lora_target
:
all
pref_beta
:
0.1
pref_loss
:
sigmoid
# choices: [sigmoid (dpo), orpo, simpo]
### dataset
dataset
:
dpo_en_demo
template
:
llama3
cutoff_len
:
2048
max_samples
:
1000
overwrite_cache
:
true
preprocessing_num_workers
:
16
dataloader_num_workers
:
4
### output
output_dir
:
saves/llama3-8b/lora/dpo
logging_steps
:
10
save_steps
:
500
plot_loss
:
true
overwrite_output_dir
:
true
save_only_model
:
false
report_to
:
none
# choices: [none, wandb, tensorboard, swanlab, mlflow]
### train
per_device_train_batch_size
:
1
gradient_accumulation_steps
:
8
learning_rate
:
5.0e-6
num_train_epochs
:
3.0
lr_scheduler_type
:
cosine
warmup_ratio
:
0.1
bf16
:
true
ddp_timeout
:
180000000
resume_from_checkpoint
:
null
### eval
# eval_dataset: dpo_en_demo
# val_size: 0.1
# per_device_eval_batch_size: 1
# eval_strategy: steps
# eval_steps: 500
docker-hub/qwen2.5-vl/llama-factory/examples/train_lora/llama3_lora_eval.yaml
0 → 100644
View file @
5ed76316
### model
model_name_or_path
:
meta-llama/Meta-Llama-3-8B-Instruct
adapter_name_or_path
:
saves/llama3-8b/lora/sft
trust_remote_code
:
true
### method
finetuning_type
:
lora
### dataset
task
:
mmlu_test
# choices: [mmlu_test, ceval_validation, cmmlu_test]
template
:
fewshot
lang
:
en
n_shot
:
5
### output
save_dir
:
saves/llama3-8b/lora/eval
### eval
batch_size
:
4
Prev
1
2
3
4
5
6
7
8
9
…
15
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment