#!/usr/bin/env bash
#
# Combine the tensor-parallel shards of a Mistral checkpoint (language model)
# and a CLIP checkpoint (vision model) into one checkpoint per rank by
# invoking examples/multimodal/combine_state_dicts.py.
#
# Required variables (edit the defaults below, or export them before running):
#   MCORE_MISTRAL  folder containing iter_0000001/mp_rank_XX/ of the Mistral model
#   MCORE_CLIP     folder containing iter_0000001/mp_rank_XX/ of the CLIP model
#   OUTPUT_DIR     folder under which the combined checkpoint is written
#
# The Python script is referenced by a relative path, so run this from the
# directory in which examples/multimodal/combine_state_dicts.py resolves.

MCORE_MISTRAL="${MCORE_MISTRAL:-}"
MCORE_CLIP="${MCORE_CLIP:-}"
OUTPUT_DIR="${OUTPUT_DIR:-}"

#######################################
# Build the per-rank argument lists and run combine_state_dicts.py.
# Globals:   MCORE_MISTRAL, MCORE_CLIP, OUTPUT_DIR (read)
# Arguments: none
# Outputs:   an error message on stderr when a required variable is empty
# Returns:   2 if a required variable is empty, otherwise python's exit status
#######################################
combine_mistral_clip() {
  local var_name
  for var_name in MCORE_MISTRAL MCORE_CLIP OUTPUT_DIR; do
    # Empty values would silently produce paths rooted at "/", so refuse them.
    if [[ -z "${!var_name}" ]]; then
      printf 'error: %s must be set to a non-empty path\n' "${var_name}" >&2
      return 2
    fi
  done

  local -r iter_dir='iter_0000001'
  local -r ckpt_file='model_optim_rng.pt'
  local -r combined_name='mistral_instruct_clip336_tp4_combined_mcore'

  local -a inputs=() prefixes=() outputs=()
  local rank
  for rank in 00 01 02 03; do
    # Inputs and prefixes are interleaved pairwise: language shard, then
    # vision shard, for every rank.
    # NOTE(review): the previous command read the rank 02 CLIP shard from an
    # extra "vit-mcore-336px-tp4/" subfolder that no other rank used; all
    # ranks now share one layout. Confirm against the checkpoint on disk.
    inputs+=(
      "${MCORE_MISTRAL}/${iter_dir}/mp_rank_${rank}/${ckpt_file}"
      "${MCORE_CLIP}/${iter_dir}/mp_rank_${rank}/${ckpt_file}"
    )
    prefixes+=(language_model vision_model)
    outputs+=(
      "${OUTPUT_DIR}/${combined_name}/${iter_dir}/mp_rank_${rank}/${ckpt_file}"
    )
  done

  python examples/multimodal/combine_state_dicts.py \
    --input "${inputs[@]}" \
    --prefixes "${prefixes[@]}" \
    --output "${outputs[@]}"
}

combine_mistral_clip