"...fattn-vec-f16-instance-hs64-f16-q4_0.cu" did not exist on "217903ab5111124041b3bb9d7a04d9101f2f32b2"
config.yaml 2.81 KB
Newer Older
yangzhong's avatar
v1.0  
yangzhong committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
# Metadata stored under the `_wandb` key: tool/interpreter version strings, a
# platform string, and several lists of integer codes keyed by quoted numbers.
# NOTE(review): the meaning of the integer codes under `t` is not visible in
# this file — presumably tool-internal identifiers; avoid editing by hand.
_wandb:
    value:
        cli_version: 0.19.1
        m: []
        python_version: 3.10.12
        t:
            # Keys are quoted so they stay strings rather than integers.
            "1": [1, 11, 41, 49, 55, 71]
            "2": [1, 11, 41, 49, 55, 71]
            "3": [13, 16, 23, 55]
            # "4" repeats python_version; "5" and "12" repeat cli_version.
            "4": 3.10.12
            "5": 0.19.1
            "6": 4.47.0
            "8": [5]
            "12": 0.19.1
            "13": linux-x86_64
# A list of five two-integer pairs, one pair per line.
# NOTE(review): presumably grid layouts used when image_aspect_ratio is
# `anyres`; which element is rows vs. columns is not visible here — confirm
# against the consumer.
anyres_grids:
    value:
        - [1, 2]
        - [2, 1]
        - [2, 2]
        - [3, 1]
        - [1, 3]
# Flat run settings: each top-level key holds its setting under a nested
# `value` field. Keys appear in alphabetical order.
anyres_patch_sampling:
    value: true
# NOTE(review): not visible here whether this is per-process or global — confirm.
batch_size:
    value: 8
checkpoint_steps:
    value: 5000
conv_template_name:
    value: phi_3
cpu_offload_gradients:
    value: false
cross_attn_every_n_layers:
    value: 1
# Absolute path under /mnt — machine-specific; adjust before reusing this
# configuration on another host.
data_path:
    value: /mnt/xgen-mm/LAVIS/data_configs/example_data_config.yaml
data_sampler_group_by_length:
    value: true
delete_previous_checkpoint:
    value: false
# Plain scalar containing `:` with no following space, so it parses as the
# single string `cuda:0` rather than a nested mapping.
device:
    value: cuda:0
dist_backend:
    value: nccl
# Likewise a plain string (`env://`); the colon is not followed by a space.
dist_url:
    value: env://
distributed:
    value: true
dryrun:
    value: false
fsdp:
    value: true
fsdp_sharding_strategy:
    value: hybrid
gradient_accumulation_steps:
    value: 1
gradient_checkpointing:
    value: true
horovod:
    value: false
image_aspect_ratio:
    value: anyres
is_multimodal:
    value: true
# Written with an explicit decimal point in the mantissa (`2.0e-05`, not
# `2e-05`): YAML 1.1 resolvers such as PyYAML only recognise exponent floats
# that contain a `.`, and would otherwise load this value as a string.
# YAML 1.2 loaders read the same numeric value in either spelling.
learning_rate:
    value: 2.0e-05
# Flat run settings: each top-level key holds its setting under a nested
# `value` field.
# Same identifier string as tokenizer_path elsewhere in this file.
lm_path:
    value: microsoft/Phi-3-mini-4k-instruct
# NOTE(review): local_rank (and rank below) are both 0 — presumably captured
# from the process that wrote this file; confirm before relying on them.
local_rank:
    value: 0
logging_steps:
    value: 100
loss:
    value: supervised_finetune
lr_scheduler:
    value: cosine
mm_use_im_start_end:
    value: false
model_family:
    value: xgenmm_v1
no_save_optim_state:
    value: true
no_set_device_rank:
    value: false
num_epochs:
    value: 1
num_vision_tokens:
    value: 128
offline:
    value: false
precision:
    value: amp_bf16
# Absolute path under /mnt — machine-specific; adjust before reusing this
# configuration on another host.
pretrained:
    value: /mnt/xgen-mm/xgen-mm-phi3-mini-base-r-v1.5.pt
# Explicit null: no value is set for this key.
pretrained_vision_tokenizer:
    value: null
rank:
    value: 0
# Flat run settings: each top-level key holds its setting under a nested
# `value` field.
report_to_wandb:
    value: true
# Explicit null: no value is set for this key.
resume_from_checkpoint:
    value: null
run_name:
    value: finetune-xgenmmv1-phi3_4k_instruct-example_data_config
save_checkpoints_to_wandb:
    value: false
seed:
    value: 42
# Same identifier string as lm_path elsewhere in this file.
tokenizer_path:
    value: microsoft/Phi-3-mini-4k-instruct
unfreeze_vision_encoder:
    value: false
use_flash_attention_2:
    value: false
vision_encoder_path:
    value: google/siglip-so400m-patch14-384
# Differs from the top-level `precision` setting (amp_bf16).
vision_encoder_precision:
    value: fp32
vision_encoder_pretrained:
    value: google
# Explicit null: no value is set for this key.
wandb_entity:
    value: null
wandb_project:
    value: blip3-xgenmm-finetune
warmup_steps:
    value: 2000
# Parses as the integer 0 (no decimal point).
weight_decay:
    value: 0
workers:
    value: 4
# NOTE(review): presumably the number of distributed processes — confirm.
world_size:
    value: 8