# afrimmlu_common_yaml
#
# Task settings for a multiple-choice evaluation over the
# `masakhane/afrimmlu` dataset.
#
# NOTE(review): the file name suggests this is a shared base that
# per-language task configs include, overriding `task` and `dataset_name`
# (both null here) -- confirm against the including files.
#
# The `!function` tag is a custom tag: the consuming loader must define it
# and resolve `utils.<name>` to a callable. A plain safe loader will reject it.

# Group labels attached to this task.
group:
  - mmlu
  - afrimmlu
  - afrimmlu_direct

# Left unset in this file (see the review note above).
task: null

# Dataset location; no dataset configuration name is selected here.
dataset_path: masakhane/afrimmlu
dataset_name: null

output_type: multiple_choice

# Dataset splits: few-shot examples are drawn from the validation split.
validation_split: validation
test_split: test
fewshot_split: validation

# Prompt text is produced by a helper referenced from `utils`.
doc_to_text: !function utils.doc_to_text

# Template that renders the zero-based position of the document's `answer`
# letter within ['A', 'B', 'C', 'D'].
doc_to_target: "{{['A', 'B', 'C', 'D'].index(answer)}}"

# Candidate answer choices are produced by a helper referenced from `utils`.
doc_to_choice: !function utils.doc_to_choice

# Decontamination is enabled; the query is the question followed by "Answer:".
should_decontaminate: true
doc_to_decontamination_query: "Question: {{question}}\nAnswer:"

metric_list:
  # F1, aggregated by a helper referenced from `utils` instead of a plain mean.
  - metric: f1
    aggregation: !function utils.weighted_f1_score
    # aggregation: mean
    # NOTE(review): the meaning of `average` and `hf_evaluate` is defined by
    # the consuming harness, not by this file -- confirm how they interact
    # with the custom aggregation above.
    average: weighted
    hf_evaluate: true
    higher_is_better: true
    # NOTE(review): the three options below look like string-normalisation
    # settings; confirm that the f1 metric actually consumes them.
    ignore_case: true
    ignore_punctuation: true
    regexes_to_ignore:
      - ","
      - "\\$"
  # Accuracy, aggregated as a mean.
  - metric: acc
    aggregation: mean
    higher_is_better: true
    # NOTE(review): same normalisation options as on f1; confirm that the acc
    # metric consumes them.
    ignore_case: true
    ignore_punctuation: true
    regexes_to_ignore:
      - ","
      - "\\$"

metadata:
  version: 1.0