# Shared evaluation settings for the CaBBQ multiple-choice task.
# NOTE(review): no `task:` key is defined here, so this file is presumably
# meant to be included by per-task configs — confirm against the callers.

# Dataset identifier (presumably a Hugging Face Hub repo id — confirm).
dataset_path: BSC-LT/CaBBQ
# No dataset configuration/subset name is set in this file.
dataset_name: null
output_type: multiple_choice
# Only a test split is configured; there is no training or validation split.
training_split: null
validation_split: null
test_split: test
# Prompt template: renders the document's `context` and `question` fields.
# The "Pregunta"/"Resposta" labels are Catalan; the template ends right after
# "Resposta:" with no trailing space or newline.
doc_to_text: "Context: {{context}}\nPregunta: {{question}}\nResposta:"
# Name of the document field used as the gold target.
# NOTE(review): presumably an index into the choice list below — confirm.
doc_to_target: label
# Answer choices: the document's `ans0` and `ans1` fields followed by nine
# fixed Catalan phrasings of an "unknown / cannot be determined" answer
# (11 entries in total). The order is part of the runtime value.
doc_to_choice: "{{[ans0, ans1, 'No hi ha prou informació', 'No hi ha informació suficient', 'No ho sé', 'No sé', 'Falta informació', 'No es pot respondre', 'No se sap', 'No es pot saber', 'No es pot determinar']}}"
# Custom per-document result processing, referenced by name from `utils`
# (the implementation is not visible in this file).
process_results: !function utils.process_results
# Reported metrics. Each one is aggregated by a custom function referenced
# from `utils` (implementations are not visible in this file).
# NOTE(review): the `ambig` / `disambig` suffixes presumably refer to
# ambiguous vs. disambiguated contexts — confirm against utils.
metric_list:
  # Accuracy metrics: a higher value is better.
  - metric: acc_ambig
    aggregation: !function utils.acc_ambig_agg
    higher_is_better: true
  - metric: acc_disambig
    aggregation: !function utils.acc_disambig_agg
    higher_is_better: true
  # Bias-score metrics: declared with higher_is_better set to false.
  - metric: bias_score_ambig
    aggregation: !function utils.bias_score_ambig_agg
    higher_is_better: false
  - metric: bias_score_disambig
    aggregation: !function utils.bias_score_disambig_agg
    higher_is_better: false
# Task metadata.
metadata:
  # Unquoted, so YAML parses this as the float 1.0 rather than a string.
  # NOTE(review): quote it only if the consumer expects a string — confirm.
  version: 1.0