# Group definition `grouptest`: a task list mixing plain task names, a nested
# group (`arc_stuff`), and a per-task override mapping.
#
# NOTE(review): this structure was reconstructed from a source in which the
# whole document was collapsed onto one line. Confirm that `metric_list` and
# `num_fewshot` are meant to sit on the `arc_easy` entry rather than on the
# enclosing `arc_stuff` group.
group: grouptest
task:
  - boolq
  - group: arc_stuff
    task:
      - arc_challenge
      - glue
      # Mapping form of a task entry: carries extra keys alongside the name.
      - task: arc_easy
        metric_list:
          - metric: acc
        num_fewshot: 3
      # Disabled entry, kept for reference:
      # - task: mmlu
      #   num_fewshot: 2