"lm_eval/tasks/belebele/belebele_amh_Ethi.yaml" did not exist on "0aa37743218177935bcdcbbf8576c98a6b4810ac"
metabench.yaml 266 Bytes
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
# Group config: bundles the six metabench_* tasks under the name `metabench`.
group: metabench
# Member tasks, referenced by name; their definitions are not in this file.
task:
  - metabench_arc
  - metabench_gsm8k
  - metabench_hellaswag
  - metabench_mmlu
  - metabench_truthfulqa
  - metabench_winogrande
# Aggregation settings for the group: the `acc` metric, combined with `mean`.
aggregate_metric_list:
  - metric: acc
    aggregation: mean
    # NOTE(review): presumably `false` gives every member task equal weight in
    # the mean instead of weighting by sample count; confirm in harness docs.
    weight_by_size: false
metadata:
  # Unquoted, so YAML parsers load this as the float 0.0 rather than a string.
  version: 0.0