---
# Task definition for `squadv2`, evaluated on the `squad_v2` dataset.
# The `!function` tags below are custom (non-standard) YAML tags; they must be
# resolved by the consuming loader (presumably to callables in sibling
# `utils` / `metric` modules -- confirm against the loader).

# --- Identity and data splits ---
task: squadv2
dataset_path: squad_v2
output_type: greedy_until
training_split: train
validation_split: validation

# --- Prompt construction ---
# Template placeholders reference the document fields `title`, `context`
# and `question`. Kept double-quoted so the `\n` escapes stay real newlines.
doc_to_text: "Title: {{title}}\n\nBackground: {{context}}\n\nQuestion: {{question}}\n\n Answer:"
# Renders `answers.text` when it is non-empty; otherwise renders the
# single-element list ['unanswerable'].
doc_to_target: "{% if answers.text| length > 0 %}{{answers.text}}{% else %}{{['unanswerable']}}{% endif %}"
# Empty string: nothing is inserted between the prompt and the target.
target_delimiter: ""

# --- Decontamination ---
should_decontaminate: true
doc_to_decontamination_query: context

# --- Result processing ---
process_results: !function utils.process_results

# --- Generation settings ---
generation_kwargs:
  # Stop strings for generation.
  until:
    - "\n\n"
    - "\n"
  # Sampling is switched off and temperature is set to zero.
  do_sample: false
  temperature: 0.0

# --- Output filtering ---
filter_list:
  - name: remove_whitespace
    filter:
      - function: remove_whitespace
      - function: take_first

# --- Metrics ---
# Every metric is aggregated with `mean` and flagged higher-is-better.
metric_list:
  # Overall scores.
  - metric: !function metric.exact
    aggregation: mean
    higher_is_better: true
  - metric: !function metric.f1
    aggregation: mean
    higher_is_better: true
  # `HasAns_*` variants (presumably restricted to answerable questions).
  - metric: !function metric.HasAns_exact
    aggregation: mean
    higher_is_better: true
  - metric: !function metric.HasAns_f1
    aggregation: mean
    higher_is_better: true
  # `NoAns_*` variants (presumably restricted to unanswerable questions).
  - metric: !function metric.NoAns_exact
    aggregation: mean
    higher_is_better: true
  - metric: !function metric.NoAns_f1
    aggregation: mean
    higher_is_better: true
  # `best_*` variants (semantics defined in the `metric` module -- not
  # visible from this file).
  - metric: !function metric.best_exact
    aggregation: mean
    higher_is_better: true
  - metric: !function metric.best_f1
    aggregation: mean
    higher_is_better: true