---
# Group definition: bundles the social-science tasks under a single group
# name and declares how their metrics are aggregated.
# NOTE(review): key semantics below are inferred from the key names; confirm
# against the group-config schema of the framework that loads this file.

# Identifier of this group.
group: arabicmmlu_social_science
# Alternate name for the group (presumably used when reporting — confirm).
group_alias: social_science
# Members of the group.
task:
  - arabicmmlu_social_science_tasks
# Metrics to aggregate across the group's members.
aggregate_metric_list:
  - metric: acc
    # Presumably weights each member's score by its size rather than taking
    # a plain mean — confirm against the consumer.
    weight_by_size: true
metadata:
  version: 0