# mgsm_chat.yaml
# Task identity and data source.
# NOTE(review): the key names look like an lm-evaluation-harness task
# config — confirm against the loader that consumes this file.
tag: llama3
task: mgsm_chat
# Dataset location and the named configuration within it (presumably a
# Hugging Face Hub repository and subset — confirm).
dataset_path: meta-llama/Llama-3.2-3B-Instruct-evals
dataset_name: Llama-3.2-3B-Instruct-evals__mgsm__details
# Output mode and the split used for testing; "latest" is the split's
# literal name in this config.
output_type: generate_until
test_split: latest
# Jinja template that builds the prompt text for one document:
#   1. take the first element of `input_final_prompts`,
#   2. remove the `<|start_header_id|>user<|end_header_id|>` marker,
#   3. remove the `<|eot_id|><|start_header_id|>assistant<|end_header_id|>`
#      marker,
#   4. trim leading and trailing whitespace.
# The value is a multi-line double-quoted scalar, so YAML folds the line
# breaks (and strips the continuation indentation) into single spaces; no
# other text may appear between the opening and closing quotes.
doc_to_text: "{{
    input_final_prompts
    |first
    |replace('<|start_header_id|>user<|end_header_id|>', '')
    |replace('<|eot_id|><|start_header_id|>assistant<|end_header_id|>', '')
    |trim
}}"
# Name of the document field used as the target (reference answers).
doc_to_target: "input_correct_responses"
# Result processing is delegated to `process_results_mgsm` from a `utils`
# module via the custom `!function` tag (presumably a utils.py next to this
# file; the function is not visible here — verify its contract there).
process_results: !function utils.process_results_mgsm
generation_kwargs:
  # Empty list: no stop sequences are configured in this file.
  until: []
  # Sampling disabled with temperature 0.0 — presumably deterministic
  # (greedy) decoding; confirm with the harness.
  do_sample: false
  temperature: 0.0
  # Generation length cap (name suggests a token count — confirm).
  max_gen_toks: 2048
metric_list:
  # Exact-match metric, averaged over documents, higher is better, with
  # case and punctuation ignored per the flags below.
  - metric: exact_match
    aggregation: mean
    higher_is_better: true
    ignore_case: true
    ignore_punctuation: true
# Answer-extraction pipelines. Each named entry lists filter functions in
# order: regex, remove_whitespace, take_first.
filter_list:
  # Strict: requires a localized "Answer" keyword followed by ": ", then
  # captures an optionally negative run of digits, dots and commas.
  - name: "strict-match"
    filter:
      - function: regex
        regex_pattern: "(?:Answer|Réponse|Antwort|Ответ|Respuesta|答え|Jibu|答案|คำตอบ|సమాధానం|উত্তর): (\\-?[0-9\\.\\,]+)"
      - function: remove_whitespace
      - function: take_first
  # Flexible: either the keyword form (captured value is at least two
  # characters from `$`, digits, dot, comma) or, failing that, any bare
  # integer anywhere in the text.
  - name: "flexible-extract"
    filter:
      - function: regex
        # NOTE(review): -1 presumably selects the last match — confirm
        # against the regex filter's implementation.
        group_select: -1
        regex_pattern: "(?:Answer|Réponse|Antwort|Ответ|Respuesta|答え|Jibu|答案|คำตอบ|సమాధానం|উত্তর): (-?[$0-9.,]{2,})|(-?[0-9]+)"
      - function: remove_whitespace
      - function: take_first
metadata:
  # Presumably the task-config version marker. Left as the float 0.0:
  # quoting it would change the parsed type from float to string.
  version: 0.0