# Task configuration for `squadv2`.
# Settings not listed here are expected to come from the included
# `_template_yaml` file (its contents are not visible from this file).
include: _template_yaml
task: squadv2
output_type: generate_until

generation_kwargs:
  # Double-quoted so that \n is parsed as a real newline character.
  # NOTE(review): presumably the consumer treats each entry as a stop
  # sequence for generation - confirm against the harness.
  until:
    - "\n"

# NOTE(review): `!function` is a custom (non-core) YAML tag; the consuming
# loader must register a constructor for it, and a plain safe loader will
# reject it. `utils.exact` / `utils.f1` are referenced by name only - their
# definitions are not visible here.
metric_list:
  - metric: !function utils.exact
    aggregation: mean
    higher_is_better: true
  - metric: !function utils.f1
    aggregation: mean
    higher_is_better: true