# Task definition for `longbench_multi_news_e`, listed under the
# `longbench_e` tag. The prompt asks for a one-page summary of several
# news passages.
# NOTE(review): the key names and the `!function` tag look like an
# lm-evaluation-harness task config -- confirm against the consuming loader.
tag:
  - longbench_e
task: longbench_multi_news_e

# Data source: the `multi_news_e` configuration of THUDM/LongBench,
# using its `test` split.
dataset_path: THUDM/LongBench
test_split: test
dataset_name: multi_news_e

# Prompt template. Kept double-quoted on one line on purpose: the `\n`
# escapes must be turned into real newlines, and the text has a space before
# the first newline that a block scalar would leave as trailing whitespace.
# `{{context}}` / `{{answers}}` are template placeholders; presumably they are
# filled from the dataset fields of the same names -- verify.
doc_to_text: "You are given several news passages. Write a one-page summary of all news. \n\nNews:\n{{context}}\n\nNow, write a one-page summary of all the news.\n\nSummary:"
# Quoted because a plain scalar starting with `{` would parse as a flow mapping.
doc_to_target: '{{answers}}'

# `!function` is a custom (non-core) YAML tag, so the consuming loader must
# define it. Presumably it resolves to `get_rouge_score` in a sibling
# `metrics` module -- confirm.
process_results: !function metrics.get_rouge_score

generation_kwargs:
  max_gen_toks: 512
  # NOTE(review): sampling is disabled below, so this temperature is
  # presumably not used by the generator -- confirm.
  temperature: 1
  do_sample: false
  # Explicit empty list: no stop sequences are configured.
  until: []

metric_list:
  - metric: rouge_score
    aggregation: mean
    higher_is_better: true

metadata:
  # Left unquoted so it stays a float, as in the original; quote it only if
  # the consumer expects a version string.
  version: 4.0