---
# Training-run configuration. Every top-level key wraps its setting in a
# single `value:` entry. The block structure below was restored from a copy
# whose line breaks and indentation had been collapsed.

# Client metadata section (CLI / Python versions and the `t` table).
_wandb:
  value:
    cli_version: "0.19.1"
    m: []
    python_version: "3.10.12"
    # NOTE(review): the numeric codes under `t` are opaque here; presumably
    # client-generated telemetry -- do not hand-edit without confirming.
    t:
      "1":
        - 1
        - 11
        - 41
        - 49
        - 55
        - 71
      "2":
        - 1
        - 11
        - 41
        - 49
        - 55
        - 71
      "3":
        - 13
        - 16
        - 23
        - 55
      "4": "3.10.12"
      "5": "0.19.1"
      "6": "4.47.0"
      "8":
        - 5
      "12": "0.19.1"
      "13": linux-x86_64

# List of two-integer pairs.
anyres_grids:
  value:
    - [1, 2]
    - [2, 1]
    - [2, 2]
    - [3, 1]
    - [1, 3]

anyres_patch_sampling:
  value: true

batch_size:
  value: 8

checkpoint_steps:
  value: 5000

conv_template_name:
  value: phi_3

cpu_offload_gradients:
  value: false

cross_attn_every_n_layers:
  value: 1

data_path:
  value: /mnt/xgen-mm/LAVIS/data_configs/example_data_config.yaml

data_sampler_group_by_length:
  value: true

delete_previous_checkpoint:
  value: false

# Quoted because the value contains a colon.
device:
  value: "cuda:0"

dist_backend:
  value: nccl

# Quoted because the value contains a colon.
dist_url:
  value: "env://"

distributed:
  value: true

dryrun:
  value: false

fsdp:
  value: true

fsdp_sharding_strategy:
  value: hybrid

gradient_accumulation_steps:
  value: 1

gradient_checkpointing:
  value: true

horovod:
  value: false

image_aspect_ratio:
  value: anyres

is_multimodal:
  value: true

# NOTE(review): `2e-05` has no decimal point. YAML 1.1 loaders (e.g. PyYAML)
# read it as a string, while YAML 1.2 loaders read it as a float. The token is
# left exactly as found; confirm which type the consumer expects.
learning_rate:
  value: 2e-05

lm_path:
  value: microsoft/Phi-3-mini-4k-instruct

local_rank:
  value: 0

logging_steps:
  value: 100

loss:
  value: supervised_finetune

lr_scheduler:
  value: cosine

mm_use_im_start_end:
  value: false

model_family:
  value: xgenmm_v1

no_save_optim_state:
  value: true

no_set_device_rank:
  value: false

num_epochs:
  value: 1

num_vision_tokens:
  value: 128

offline:
  value: false

precision:
  value: amp_bf16

pretrained:
  value: /mnt/xgen-mm/xgen-mm-phi3-mini-base-r-v1.5.pt

pretrained_vision_tokenizer:
  value: null

rank:
  value: 0

report_to_wandb:
  value: true

resume_from_checkpoint:
  value: null

run_name:
  value: finetune-xgenmmv1-phi3_4k_instruct-example_data_config

save_checkpoints_to_wandb:
  value: false

seed:
  value: 42

tokenizer_path:
  value: microsoft/Phi-3-mini-4k-instruct

unfreeze_vision_encoder:
  value: false

use_flash_attention_2:
  value: false

vision_encoder_path:
  value: google/siglip-so400m-patch14-384

vision_encoder_precision:
  value: fp32

vision_encoder_pretrained:
  value: google

wandb_entity:
  value: null

wandb_project:
  value: blip3-xgenmm-finetune

warmup_steps:
  value: 2000

weight_decay:
  value: 0

workers:
  value: 4

world_size:
  value: 8