group: flan_held_out task:
# BBH - bbh_flan_zeroshot - bbh_flan_fewshot - bbh_flan_cot_fewshot - bbh_flan_cot_zeroshot # MMLU - mmlu_flan_n_shot_generative - mmlu_flan_n_shot_loglikelihood - mmlu_flan_cot_zeroshot - mmlu_flan_cot_fewshot