tag: - longbench_e task: longbench_2wikimqa_e dataset_path: THUDM/LongBench test_split: test dataset_name: 2wikimqa_e doc_to_text: "Answer the question based on the given passages. Only give me the answer and do not output any other words.\n\nThe following are given passages.\n{{context}}\n\nAnswer the question based on the given passages. Only give me the answer and do not output any other words.\n\nQuestion: {{input}}\nAnswer:" doc_to_target: '{{answers}}' process_results: !function metrics.get_qa_f1_score generation_kwargs: max_gen_toks: 32 temperature: 1 do_sample: False until: [] metric_list: - metric: "qa_f1_score" aggregation: mean higher_is_better: True metadata: version: 4.0