# sciq.yaml
# Declares the task `sciq` and lists it under the `multiple_choice` group.
group:
  - multiple_choice
task: sciq
# Dataset identifier (no sub-configuration name) and the split used for each
# phase.
dataset_path: sciq
dataset_name: null
output_type: multiple_choice
training_split: train
validation_split: validation
test_split: test
# Set the list of possible answer choices, and set what this doc's gold label
# idx is. `correct_answer` is the fourth entry of `answer_choices`, hence the
# zero-based `gold = 3`.
template_aliases: "{% set answer_choices = [distractor1, distractor2, distractor3, correct_answer] %}{% set gold = 3 %}"
# Prompt layout: the `support` field with leading whitespace stripped, then
# the question on its own line, then an "Answer:" cue.
doc_to_text: "{{support.lstrip()}}\nQuestion: {{question}}\nAnswer:"
# Target text: the correct answer preceded by a single space, so it follows
# directly after the "Answer:" cue that ends `doc_to_text`.
doc_to_target: " {{correct_answer}}"
# `gold` is the index variable defined in `template_aliases`.
gold_alias: "{{gold}}"  # this will be cast to an int.
# Metrics for this task. Each one is aggregated with `mean`, and a higher
# value is better.
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true
  - metric: acc_norm
    aggregation: mean
    higher_is_better: true
  - metric: acc_mutual_info
    aggregation: mean
    higher_is_better: true