# Group definition: names the group `mmlu_stem`, gives it the alias `stem`,
# and lists the task entries that belong to it.
group: mmlu_stem
group_alias: stem
task:
  - mmlu_stem_tasks

# Metrics reported for the group as a whole. Only `acc` is aggregated here.
aggregate_metric_list:
  - metric: acc
    # NOTE(review): presumably weights each member task by its sample count
    # when aggregating — confirm against the consuming tool's documentation.
    weight_by_size: true

# NOTE(review): `metadata` is reconstructed as a top-level key holding
# `version`; confirm this matches the consumer's expected schema.
metadata:
  version: 1