# Group definition that bundles the STEM subset of tasks under one name.
# NOTE(review): the key names match the group-config layout used by
# lm-evaluation-harness; confirm against the consuming tool.
group: arabicmmlu_stem
# Alternate name for the group (presumably a short display label; verify).
group_alias: stem

# Members of this group.
task:
  - arabicmmlu_stem_tasks

# Metrics reported for the group as a whole.
aggregate_metric_list:
  - metric: acc
    # Presumably weights each member's score by its size when aggregating,
    # rather than taking an unweighted mean; verify against the consumer.
    weight_by_size: true

metadata:
  version: 0