Status Job Pipeline Stage Name Duration Coverage
failed #10524
NV_megatron_lm_core_0.9
c9289b90
ssh_selene_runner allowed to fail
#1851 by liangjing's avatar cleanup cleanup.selene

failed #10523
dtk-24.04_megatron-lm_core_0.9
f2464dc2
ssh_selene_runner allowed to fail
#1850 by liangjing's avatar cleanup cleanup.selene

canceled #10522
NV_megatron_lm_core_0.9
64c0033e
ssh_selene_runner allowed to fail
#1849 by liangjing's avatar cleanup cleanup.selene

failed #10521
dtk-24.04_megatron-lm_core_0.9
0b5cd1a0
ssh_selene_runner allowed to fail
#1848 by liangjing's avatar cleanup cleanup.selene

canceled #10520
dtk-24.04_megatron-lm_core_0.9
5352a639
ssh_selene_runner allowed to fail
#1847 by liangjing's avatar cleanup cleanup.selene

failed #10480
NV_megatron_lm_core_0.9
4b097dee
ssh_selene_runner allowed to fail
#1840 by liangjing's avatar cleanup cleanup.selene

failed #10240
dtk-24.04_megatron-lm_core_0.9
4b097dee
ssh_selene_runner allowed to fail
#1807 by liangjing's avatar cleanup cleanup.selene

canceled #10239
dtk-24.04_megatron-lm_core_0.9
3aca1415
ssh_selene_runner allowed to fail
#1806 by liangjing's avatar cleanup cleanup.selene

failed #5697
3.0.2+das1.1
3aca1415
ssh_selene_runner allowed to fail
#1066 by liangjing's avatar cleanup cleanup.selene

failed #4983
main
3aca1415
ssh_selene_runner allowed to fail
#952 by liangjing's avatar cleanup cleanup.selene

failed #4982
main
3aca1415
ssh_selene_runner
#952 by liangjing's avatar test resume.checkpoint.bert.345m_tp1_pp2_1node

failed #4981
main
3aca1415
ssh_selene_runner
#952 by liangjing's avatar test train.bert.345m_tp1_pp4_1node_50steps

failed #4980
main
3aca1415
ssh_selene_runner
#952 by liangjing's avatar test train.bert.345m_tp1_pp2_1node_50steps

failed #4979
main
3aca1415
ssh_selene_runner
#952 by liangjing's avatar test train.bert.345m_tp2_pp2_1node_50steps

failed #4978
main
3aca1415
ssh_selene_runner
#952 by liangjing's avatar test train.bert.345m_tp4_pp1_1node_50steps

failed #4977
main
3aca1415
ssh_selene_runner
#952 by liangjing's avatar test resume.checkpoint.gpt3.345m_tp1_pp2_1node

failed #4976
main
3aca1415
ssh_selene_runner
#952 by liangjing's avatar test train.gpt3.345m_tp1_pp4_1node_50steps

failed #4975
main
3aca1415
ssh_selene_runner
#952 by liangjing's avatar test train.gpt3.345m_tp1_pp2_1node_50steps

failed #4974
main
3aca1415
ssh_selene_runner
#952 by liangjing's avatar test train.gpt3.345m_tp2_pp2_1node_50steps

failed #4973
main
3aca1415
ssh_selene_runner
#952 by liangjing's avatar test train.gpt3.345m_tp4_pp1_1node_50steps

failed #4972
refs/merge-requests/1/head
1005e9d3
ssh_selene_runner allowed to fail
#951 by liangjing's avatar cleanup cleanup.selene

failed #4971
refs/merge-requests/1/head
1005e9d3
docker_local_runner
#951 by liangjing's avatar test unit_tests

failed #4970
megatron-lm_dtk24.04
1005e9d3
ssh_selene_runner allowed to fail
#950 by liangjing's avatar cleanup cleanup.selene

failed #4277
megatron-lm_dtk24.04
051f58f1
ssh_selene_runner allowed to fail
#829 by liangjing's avatar cleanup cleanup.selene

failed #807
dtk-22.10_megatron-lm3.0.2
5602760a
#230 by zhuwenwen's avatar test test

failed #806
main
0024a5c6
ssh_selene_runner allowed to fail
#229 by zhuwenwen's avatar cleanup cleanup.selene

failed #805
main
0024a5c6
ssh_selene_runner
#229 by zhuwenwen's avatar test resume.checkpoint.bert.345m_tp1_pp2_1node

failed #804
main
0024a5c6
ssh_selene_runner
#229 by zhuwenwen's avatar test train.bert.345m_tp1_pp4_1node_50steps

failed #803
main
0024a5c6
ssh_selene_runner
#229 by zhuwenwen's avatar test train.bert.345m_tp1_pp2_1node_50steps

failed #802
main
0024a5c6
ssh_selene_runner
#229 by zhuwenwen's avatar test train.bert.345m_tp2_pp2_1node_50steps