# Evaluation task configuration for the HAERAE-HUB/HRM8K dataset.
# Values tagged `!function` are resolved by the consuming loader's custom
# tag handler; presumably they point at a sibling `utils` module -- confirm.

# Data source and the split used for evaluation.
dataset_path: HAERAE-HUB/HRM8K
output_type: generate_until
test_split: test

# Prompt construction, reference extraction, and scoring hooks.
doc_to_text: !function utils.doc_to_text
doc_to_target: !function utils.doc_to_target
process_results: !function utils.process_results

# No few-shot examples are requested.
num_fewshot: 0

generation_kwargs:
  # Strings listed under `until` (presumably stop sequences -- confirm
  # against the consumer).
  until:
    # NOTE(review): this entry is an empty string. It may be the residue of
    # a token that was stripped somewhere upstream (e.g. a tag-like
    # end-of-sequence marker) -- confirm the intended value.
    - ""
    - "<|end_of_text|>"
    - "<|endoftext|>"
    - "<|im_end|>"
  max_gen_toks: 2048
  # Sampling is disabled and temperature is zero.
  do_sample: false
  temperature: 0

metric_list:
  - metric: exact_match
    aggregation: mean
    higher_is_better: true

metadata:
  version: 1.1