# _template_mc
#
# Task configuration for a two-option multiple-choice evaluation.
# NOTE(review): the file name suggests this is a shared template that
# per-language/per-subset task files include — confirm against the callers.

# Dataset identifier.
# NOTE(review): presumably a Hugging Face Hub repository id — confirm.
dataset_path: mrlbenchmarks/global-piqa-nonparallel
output_type: multiple_choice
# Only a test split is configured; no training/validation/few-shot split
# is declared in this file.
test_split: test

# NOTE(review): `prompt` and `label` are presumably dataset column names
# (question text and index of the correct choice) — verify against the
# dataset schema.
doc_to_text: prompt
doc_to_target: label
# Template expression that builds a two-element list from the `solution0`
# and `solution1` fields. It must stay quoted: an unquoted value starting
# with `{` would be parsed by YAML as a flow mapping.
doc_to_choice: "{{[solution0, solution1]}}"

# Three metrics are reported; each is aggregated with `mean` and is
# flagged as higher-is-better.
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true
  - metric: acc_norm
    aggregation: mean
    higher_is_better: true
  - metric: acc_bytes
    aggregation: mean
    higher_is_better: true

metadata:
  # Left unquoted on purpose so the parsed type (float) is unchanged.
  # NOTE(review): confirm the consumer expects a number, not a string.
  version: 1.0