---
# Task configuration for the `bbh` group.
# Examples are read from the `lukaemon/bbh` dataset and scored on its
# `test` split with a single exact-match metric.
group: bbh
dataset_path: lukaemon/bbh
output_type: greedy_until
test_split: test

# Prompt template: the example's `input` field is wrapped in a Q/A frame.
# Double quotes are required so that `\n` is read as a real newline.
doc_to_text: "Q: {{input}}\nA:"
# Reference answer template: the example's `target` field, unchanged.
# Quoted because a plain scalar starting with `{` would parse as a flow map.
doc_to_target: "{{target}}"

# Exact-match score, averaged over examples; larger values are better.
metric_list:
  - metric: exact_match
    aggregation: mean
    higher_is_better: true

generation_kwargs:
  # NOTE(review): the only stop sequence is an empty string. This looks like
  # a stop token that was lost upstream (e.g. an angle-bracketed marker
  # stripped during extraction) -- confirm the intended value.
  until:
    - ""
  # Sampling is disabled and temperature is zero.
  do_sample: false
  temperature: 0.0