# This file will be included in the generated language-specific task configs.
# It doesn't have a yaml file extension as it is not meant to be imported
# directly by the harness.

# Groups this task template is registered under.
group:
  - mgsm
  - afrimgsm
  - afrimgsm_en_cot

dataset_path: masakhane/afrimgsm
dataset_name: null  # Overridden by language-specific config.
output_type: generate_until
training_split: train
test_split: test

generation_kwargs:
  # Stop sequences: a blank line or a single newline ends generation.
  until:
    - "\n\n"
    - "\n"
  # Sampling is disabled and temperature is zero.
  do_sample: false
  temperature: 0.0

target_delimiter: " "

metric_list:
  - metric: exact_match
    aggregation: mean
    higher_is_better: true
    ignore_case: true
    ignore_punctuation: true

filter_list:
  # Captures the numeric token that directly follows "The answer is ".
  - name: "strict-match"
    filter:
      - function: "regex"
        regex_pattern: "The answer is (\\-?[0-9\\.\\,]+)"
      - function: "take_first"
  # Looser extraction: any run of two or more of [$0-9.,] (optionally
  # negative), or a bare integer.
  # NOTE(review): group_select: -1 presumably picks the last match in the
  # response - confirm against the harness's regex filter implementation.
  - name: flexible-extract
    filter:
      - function: regex
        group_select: -1
        # Single-quoted so the brackets, braces and commas in the pattern can
        # never be read as YAML flow syntax; the value itself is unchanged.
        regex_pattern: '(-?[$0-9.,]{2,})|(-?[0-9]+)'
      - function: take_first

metadata:
  version: 2.0