# Task configuration for `ruler_qa_squad`.
# Keys not set here are presumably taken from the included base file;
# confirm the merge/override semantics against the config loader.
include: niah_single_1.yaml
task: ruler_qa_squad

# `!function` is a custom tag that must be resolved by the consuming loader
# (a plain safe loader will reject it). It names `get_squad` in `qa_utils`.
download_dataset: !function qa_utils.get_squad
test_split: test

generation_kwargs:
  # Sampling is switched off and temperature is zero.
  do_sample: false
  temperature: 0.0
  # NOTE(review): presumably the cap on generated tokens per sample; confirm.
  max_gen_toks: 32
  # Explicit empty list (not null). NOTE(review): presumably means "no stop
  # sequences", overriding any inherited from the included file; confirm.
  until: []