# Group definition: bundles the five afrimgsm prompt-variant task sets under
# one group name and declares how their scores are combined.
group: afrimgsm-irokobench

# Member tasks, one entry per prompt variant (1 through 5).
task:
  - afrimgsm_tasks_prompt_1
  - afrimgsm_tasks_prompt_2
  - afrimgsm_tasks_prompt_3
  - afrimgsm_tasks_prompt_4
  - afrimgsm_tasks_prompt_5

# Group-level aggregation: the `acc` metric is combined across members with a
# mean, with weight_by_size enabled.
# NOTE(review): presumably weight_by_size weights each member by its number of
# examples; confirm against the consuming tool's documentation. Also confirm
# that every member task actually reports a metric named `acc`.
aggregate_metric_list:
  - metric: acc
    aggregation: mean
    weight_by_size: true

metadata:
  version: 2