# Group definition: declares the group `mmlu_stem` (alias `stem`), the task
# entries it contains, and the metrics reported for the group as a whole.
group: mmlu_stem
group_alias: stem

# Members of the group. NOTE(review): `mmlu_stem_tasks` is presumably a tag
# or sub-group defined elsewhere rather than a single task - confirm.
task:
  - mmlu_stem_tasks

# One entry per metric aggregated across the group's members.
# NOTE(review): `weight_by_size: true` presumably weights each member's score
# by its number of samples instead of taking a plain mean - confirm against
# the consuming tool's documentation.
aggregate_metric_list:
  - metric: acc
    weight_by_size: true
  - metric: acc_norm
    weight_by_size: true

metadata:
  version: 2