# _translate_yaml
# Shared task settings; documents come from the dataset named in `dataset_path`.
# NOTE(review): `task` and `dataset_name` are null here - presumably they are
# supplied by per-language configs that include this file; confirm.
group:
  - mmlu
  - afrimmlu_translate
task: null
dataset_path: masakhane/afrimmlu-translate-test
dataset_name: null
output_type: multiple_choice
test_split: test
# Prompt text and answer choices come from functions referenced in `utils`
# through the custom `!function` tag (the consuming loader must define it).
doc_to_text: !function utils.doc_to_text
# Target is the zero-based position of `answer` in the list 'A', 'B', 'C', 'D'.
doc_to_target: "{{['A', 'B', 'C', 'D'].index(answer)}}"
doc_to_choice: !function utils.doc_to_choice
should_decontaminate: true
doc_to_decontamination_query: "Question: {{question}}\nAnswer:"
# Metrics reported for this task. Both entries share the same
# normalisation options (case, punctuation, and the "," / "\$" patterns).
metric_list:
  # F1 with `average: weighted`; aggregation is delegated to a function
  # referenced in `utils` rather than the plain mean kept commented out below.
  - metric: f1
    aggregation: !function utils.weighted_f1_score
    # aggregation: mean
    average: weighted
    hf_evaluate: true
    higher_is_better: true
    ignore_case: true
    ignore_punctuation: true
    regexes_to_ignore:
      - ","
      - "\\$"
  # Accuracy with mean aggregation.
  - metric: acc
    aggregation: mean
    higher_is_better: true
    ignore_case: true
    ignore_punctuation: true
    regexes_to_ignore:
      - ","
      - "\\$"
# Config metadata. `version` is an unquoted 1.0, so YAML loaders read it as a
# float rather than a string.
metadata:
  version: 1.0