Commit 25869601 authored by Baber
Browse files

Merge branch 'main' into mathvista

# Conflicts:
#	lm_eval/models/hf_vlms.py
parents 56f40c53 c1d8795d
# File generated by `create-yamls.py`
# FLORES translation task: German source sentence -> Galician target.
include: _flores_common_yaml
task: flores_de-gl
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "German sentence: {{sentence_deu_Latn}}\nGalician sentence:"
doc_to_target: '{{sentence_glg_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: English source sentence -> Galician target.
include: _flores_common_yaml
task: flores_en-gl
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "English sentence: {{sentence_eng_Latn}}\nGalician sentence:"
doc_to_target: '{{sentence_glg_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: Spanish source sentence -> Galician target.
include: _flores_common_yaml
task: flores_es-gl
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "Spanish sentence: {{sentence_spa_Latn}}\nGalician sentence:"
doc_to_target: '{{sentence_glg_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: Basque source sentence -> Galician target.
include: _flores_common_yaml
task: flores_eu-gl
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "Basque sentence: {{sentence_eus_Latn}}\nGalician sentence:"
doc_to_target: '{{sentence_glg_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: French source sentence -> Galician target.
include: _flores_common_yaml
task: flores_fr-gl
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "French sentence: {{sentence_fra_Latn}}\nGalician sentence:"
doc_to_target: '{{sentence_glg_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: Galician source sentence -> Catalan target.
include: _flores_common_yaml
task: flores_gl-ca
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "Galician sentence: {{sentence_glg_Latn}}\nCatalan sentence:"
doc_to_target: '{{sentence_cat_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: Galician source sentence -> German target.
include: _flores_common_yaml
task: flores_gl-de
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "Galician sentence: {{sentence_glg_Latn}}\nGerman sentence:"
doc_to_target: '{{sentence_deu_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: Galician source sentence -> English target.
include: _flores_common_yaml
task: flores_gl-en
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "Galician sentence: {{sentence_glg_Latn}}\nEnglish sentence:"
doc_to_target: '{{sentence_eng_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: Galician source sentence -> Spanish target.
include: _flores_common_yaml
task: flores_gl-es
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "Galician sentence: {{sentence_glg_Latn}}\nSpanish sentence:"
doc_to_target: '{{sentence_spa_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: Galician source sentence -> Basque target.
include: _flores_common_yaml
task: flores_gl-eu
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "Galician sentence: {{sentence_glg_Latn}}\nBasque sentence:"
doc_to_target: '{{sentence_eus_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: Galician source sentence -> French target.
include: _flores_common_yaml
task: flores_gl-fr
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "Galician sentence: {{sentence_glg_Latn}}\nFrench sentence:"
doc_to_target: '{{sentence_fra_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: Galician source sentence -> Italian target.
include: _flores_common_yaml
task: flores_gl-it
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "Galician sentence: {{sentence_glg_Latn}}\nItalian sentence:"
doc_to_target: '{{sentence_ita_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: Galician source sentence -> Portuguese target.
include: _flores_common_yaml
task: flores_gl-pt
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "Galician sentence: {{sentence_glg_Latn}}\nPortuguese sentence:"
doc_to_target: '{{sentence_por_Latn}}'
# Group bundling the FLORES translation tasks that have Galician (gl) on one
# side; each language pair is listed in both directions.
group: flores_gl
task:
  - flores_es-gl
  - flores_gl-es
  - flores_en-gl
  - flores_gl-en
  - flores_eu-gl
  - flores_gl-eu
  - flores_pt-gl
  - flores_gl-pt
  - flores_it-gl
  - flores_gl-it
  - flores_fr-gl
  - flores_gl-fr
  - flores_ca-gl
  - flores_gl-ca
  - flores_gl-de
  - flores_de-gl
# Group-level score: plain mean of the member tasks' BLEU, not weighted by
# size. `aggregation` and `weight_by_size` must be nested under the metric
# entry, otherwise they parse as unrelated top-level keys.
aggregate_metric_list:
  - metric: bleu
    aggregation: mean
    weight_by_size: false
metadata:
  version: 1.0
# File generated by `create-yamls.py`
# FLORES translation task: Italian source sentence -> Galician target.
include: _flores_common_yaml
task: flores_it-gl
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "Italian sentence: {{sentence_ita_Latn}}\nGalician sentence:"
doc_to_target: '{{sentence_glg_Latn}}'
# File generated by `create-yamls.py`
# FLORES translation task: Portuguese source sentence -> Galician target.
include: _flores_common_yaml
task: flores_pt-gl
# Double-quoted with an explicit \n so the prompt keeps its line break; a bare
# line break inside a quoted scalar is folded into a single space by YAML.
doc_to_text: "Portuguese sentence: {{sentence_por_Latn}}\nGalician sentence:"
doc_to_target: '{{sentence_glg_Latn}}'
# GalCoLA: two-way multiple-choice task over single Galician sentences,
# loaded from the `proxectonos/galcola` dataset.
task: galcola
dataset_path: proxectonos/galcola
output_type: multiple_choice
training_split: train
validation_split: validation
test_split: test
# Prompt: the sentence, then a Galician question/answer cue on separate lines.
doc_to_text: "{{sentence}}\nPregunta: Ten sentido esta frase?\nResposta:"
# NOTE(review): presumably `label` is an index into doc_to_choice
# (0 -> "non", 1 -> "si") - confirm against the dataset schema.
doc_to_target: label
doc_to_choice: ["non", "si"]
should_decontaminate: true
doc_to_decontamination_query: sentence
metric_list:
  - metric: mcc
  - metric: acc
# `version` must be nested; at column 0 it would leave `metadata` null.
metadata:
  version: 1.0
# Top-level group collecting the Galician benchmark tasks and sub-groups.
group: galician_bench
task:
  - belebele_glg_Latn
  - flores_gl
  - galcola
  - summarization_gl
  - parafrases_gl
  - paws_gl
  - openbookqa_gl
  - mgsm_direct_gl
  - truthfulqa_gl
  - xnli_gl
  - xstorycloze_gl
# `version` must be nested; at column 0 it would leave `metadata` null.
metadata:
  version: 1.0
# MGSM (direct answer) in Galician: free-form generation scored by exact
# match against the numeric answer rendered as a string.
task: mgsm_direct_gl
dataset_path: proxectonos/mgsm_gl
doc_to_target: '{{answer_number|string}}'
# When `answer` is set the question is used as-is; otherwise it is prefixed
# with "Pregunta: ". Single-quoted, so YAML passes the backslash sequences
# through untouched to the template.
doc_to_text: '{% if answer != None %}{{question + "\nResposta: "}}{% else %}{{"Pregunta: " + question + "\nResposta: "}}{% endif %}'
output_type: generate_until
training_split: train
test_split: test
# Empty delimiter: the prompt already ends with "Resposta: ".
target_delimiter: ""
# Stop sequences for generation.
generation_kwargs:
  until:
    - "\n\n"
    - "\n"
# One filter pipeline: strip whitespace, then keep the first response.
filter_list:
  - name: remove_whitespace
    filter:
      - function: remove_whitespace
      - function: take_first
# The options below belong to the exact_match entry and must be nested under
# it; at column 0 they would parse as unrelated top-level keys.
metric_list:
  - metric: exact_match
    aggregation: mean
    higher_is_better: true
    ignore_case: true
    ignore_punctuation: true
metadata:
  version: 1.0
# Task configuration directly taken from Eleuther AI's implementation as of March 22, 2024
# OpenBookQA in Galician: multiple-choice task with no training split.
task: openbookqa_gl
dataset_path: proxectonos/openbookqa_gl
output_type: multiple_choice
training_split: null
validation_split: validation
test_split: test
doc_to_text: question_stem
# Target is the position of the (left-stripped) answer key within the
# choice labels; the choices themselves are the matching texts.
doc_to_target: "{{choices.label.index(answerKey.lstrip())}}"
doc_to_choice: "{{choices.text}}"
should_decontaminate: true
doc_to_decontamination_query: question_stem
# Each metric carries its own aggregation settings; they must be nested under
# their entry, otherwise the repeated keys collide at top level.
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true
  - metric: acc_norm
    aggregation: mean
    higher_is_better: true
metadata:
  version: 1.0
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment