extended|ifeval|0|0
custom|hellaswag|0|1
custom|arc|0|1
custom|piqa|0|1
custom|mmlu_pro|0|1
custom|bbh|3|1
custom|gsm8k|5|1