Merge branch 'main' into autobatchtest

# Conflicts:
#	lm_eval/models/huggingface.py

Merge branch 'main' into autobatchtest
# Conflicts:
#	lm_eval/models/huggingface.py
948f120f · Baber · a5b1c7a8 · bd80a6c0 · 948f120f · 948f120f
Commit 948f120f authored Nov 09, 2024 by Baber
20 changed files
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_ca-eu.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_ca-eu.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_ca-eu
+doc_to_text: 'Catalan sentence: {{sentence_cat_Latn}}
+
+  Basque sentence:'
+doc_to_target: '{{sentence_eus_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_de-eu.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_de-eu.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_de-eu
+doc_to_text: 'German sentence: {{sentence_deu_Latn}}
+
+  Basque sentence:'
+doc_to_target: '{{sentence_eus_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_en-eu.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_en-eu.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_en-eu
+doc_to_text: 'English sentence: {{sentence_eng_Latn}}
+
+  Basque sentence:'
+doc_to_target: '{{sentence_eus_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_es-eu.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_es-eu.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_es-eu
+doc_to_text: 'Spanish sentence: {{sentence_spa_Latn}}
+
+  Basque sentence:'
+doc_to_target: '{{sentence_eus_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_eu-ca.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_eu-ca.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_eu-ca
+doc_to_text: 'Basque sentence: {{sentence_eus_Latn}}
+
+  Catalan sentence:'
+doc_to_target: '{{sentence_cat_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_eu-de.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_eu-de.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_eu-de
+doc_to_text: 'Basque sentence: {{sentence_eus_Latn}}
+
+  German sentence:'
+doc_to_target: '{{sentence_deu_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_eu-en.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_eu-en.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_eu-en
+doc_to_text: 'Basque sentence: {{sentence_eus_Latn}}
+
+  English sentence:'
+doc_to_target: '{{sentence_eng_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_eu-es.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_eu-es.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_eu-es
+doc_to_text: 'Basque sentence: {{sentence_eus_Latn}}
+
+  Spanish sentence:'
+doc_to_target: '{{sentence_spa_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_eu-fr.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_eu-fr.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_eu-fr
+doc_to_text: 'Basque sentence: {{sentence_eus_Latn}}
+
+  French sentence:'
+doc_to_target: '{{sentence_fra_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_eu-gl.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_eu-gl.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_eu-gl
+doc_to_text: 'Basque sentence: {{sentence_eus_Latn}}
+
+  Galician sentence:'
+doc_to_target: '{{sentence_glg_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_eu-it.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_eu-it.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_eu-it
+doc_to_text: 'Basque sentence: {{sentence_eus_Latn}}
+
+  Italian sentence:'
+doc_to_target: '{{sentence_ita_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_eu-pt.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_eu-pt.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_eu-pt
+doc_to_text: 'Basque sentence: {{sentence_eus_Latn}}
+
+  Portuguese sentence:'
+doc_to_target: '{{sentence_por_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_eu.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_eu.yaml
+# Group definition: collects the flores_* translation tasks listed under `task`
+# (each language paired with `eu` in both directions) under the name `flores_eu`.
+group: flores_eu
+task:
+  - flores_es-eu
+  - flores_eu-es
+  - flores_en-eu
+  - flores_eu-en
+  - flores_eu-pt
+  - flores_pt-eu
+  - flores_eu-it
+  - flores_it-eu
+  - flores_eu-fr
+  - flores_fr-eu
+  - flores_eu-ca
+  - flores_ca-eu
+  - flores_eu-gl
+  - flores_gl-eu
+  - flores_eu-de
+  - flores_de-eu
+# Group-level score: BLEU aggregated with `mean`; `weight_by_size: false`
+# presumably makes every subtask count equally regardless of its size -
+# confirm against the harness documentation.
+aggregate_metric_list:
+  - metric: bleu
+    aggregation: mean
+    weight_by_size: false
+metadata:
+  version: 1.0
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_fr-eu.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_fr-eu.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_fr-eu
+doc_to_text: 'French sentence: {{sentence_fra_Latn}}
+
+  Basque sentence:'
+doc_to_target: '{{sentence_eus_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_gl-eu.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_gl-eu.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_gl-eu
+doc_to_text: 'Galician sentence: {{sentence_glg_Latn}}
+
+  Basque sentence:'
+doc_to_target: '{{sentence_eus_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_it-eu.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_it-eu.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_it-eu
+doc_to_text: 'Italian sentence: {{sentence_ita_Latn}}
+
+  Basque sentence:'
+doc_to_target: '{{sentence_eus_Latn}}'
--- a/lm_eval/tasks/basque_bench/flores_eu/flores_pt-eu.yaml
+++ b/lm_eval/tasks/basque_bench/flores_eu/flores_pt-eu.yaml
+# File generated by `create-yamls.py`
+include: _flores_common_yaml
+task: flores_pt-eu
+doc_to_text: 'Portuguese sentence: {{sentence_por_Latn}}
+
+  Basque sentence:'
+doc_to_target: '{{sentence_eus_Latn}}'
--- a/lm_eval/tasks/basque_bench/mgsm_cot_native_eu.yaml
+++ b/lm_eval/tasks/basque_bench/mgsm_cot_native_eu.yaml
+# Generation task on the HiTZ/MGSM-eu dataset whose prompt ends with
+# "Erantzuna urratsez urrats:".
+# NOTE(review): the task name is `mgsm_native_cot_eu` while the file is named
+# `mgsm_cot_native_eu.yaml` (word order differs) - confirm which is intended.
+task: mgsm_native_cot_eu
+dataset_path: HiTZ/MGSM-eu
+dataset_name: null
+# Target: `answer` with its first 27 characters dropped when `answer` is set,
+# otherwise `answer_number` rendered as a string.
+# NOTE(review): 27 is presumably the length of a fixed prefix in the dataset's
+# `answer` field - TODO confirm against the data.
+doc_to_target: '{% if answer is not none %}{{answer[27:]}}{% else %}{{answer_number|string}}{%endif %}'
+# Prompt: the question followed by "Erantzuna urratsez urrats:"; the
+# "Galdera: " prefix is only added when `answer` is none.
+doc_to_text: '{% if answer is not none %}{{question+"\nErantzuna urratsez urrats:"}}{% else %}{{"Galdera: "+question+"\nErantzuna urratsez urrats:"}}{% endif %}'
+output_type: generate_until
+training_split: train
+test_split: test
+target_delimiter: " "
+generation_kwargs:
+  # Stop strings for generation.
+  # NOTE(review): "\n" already matches wherever "\n\n" would, so the latter
+  # looks redundant, and output would end at the first newline - confirm this
+  # is intended for a step-by-step answer.
+  until:
+    - "\n\n"
+    - "\n"
+    - "Galdera:"
+    - </s>
+    - <|im_end|>
+  do_sample: false
+  temperature: 0.0
+filter_list:
+  - name: "get-answer"
+    filter:
+      # Matches "Erantzuna <number> da" with an optional `$` or `%` on either
+      # side of the number; the number is the first capture group.
+      - function: "regex"
+        regex_pattern: "Erantzuna [$%]? ?(-?[0-9]+([ .,][0-9.,]+)?) ?[$%]? da"
+      - function: "take_first"
+metric_list:
+  # Exact match with case and punctuation ignored; the " " entry in
+  # `regexes_to_ignore` targets spaces.
+  - metric: exact_match
+    aggregation: mean
+    higher_is_better: true
+    ignore_case: true
+    ignore_punctuation: true
+    regexes_to_ignore:
+      - " "
+metadata:
+  version: 1.0
--- a/lm_eval/tasks/basque_bench/mgsm_direct_eu.yaml
+++ b/lm_eval/tasks/basque_bench/mgsm_direct_eu.yaml
+# Generation task on the HiTZ/MGSM-eu dataset whose prompt ends with
+# "Erantzuna:" and whose target is the bare answer number.
+task: mgsm_direct_eu
+dataset_path: HiTZ/MGSM-eu
+dataset_name: null
+# Target: `answer_number` rendered as a string.
+doc_to_target: '{{answer_number|string}}'
+# Prompt: the question followed by "Erantzuna:"; the "Galdera: " prefix is
+# only added when `answer` is none.
+doc_to_text: '{% if answer is not none %}{{question+"\nErantzuna:"}}{% else %}{{"Galdera: "+question+"\nErantzuna:"}}{% endif %}'
+output_type: generate_until
+training_split: train
+test_split: test
+target_delimiter: " "
+generation_kwargs:
+  # Stop strings for generation.
+  until:
+    - "\n\n"
+    - "\n"
+    - "Galdera:"
+    - </s>
+    - <|im_end|>
+  do_sample: false
+  temperature: 0.0
+# Two named filter pipelines are declared; each ends with `take_first`.
+filter_list:
+  - name: remove_whitespace
+    filter:
+      - function: remove_whitespace
+      - function: take_first
+  - name: flexible-extract
+    filter:
+    # Regex for an optionally negative number that may contain space, "." or
+    # "," separators; `group_select: -1` presumably picks the last match -
+    # confirm against the harness filter documentation.
+    - function: regex
+      group_select: -1
+      regex_pattern: (-?[0-9]+([ .,][0-9.,]+)?)
+    - function: take_first
+metric_list:
+  # Exact match with case and punctuation ignored; the " " entry in
+  # `regexes_to_ignore` targets spaces.
+  - metric: exact_match
+    aggregation: mean
+    higher_is_better: true
+    ignore_case: true
+    ignore_punctuation: true
+    regexes_to_ignore:
+      - " "
+metadata:
+  version: 1.0
--- a/lm_eval/tasks/basque_bench/utils.py
+++ b/lm_eval/tasks/basque_bench/utils.py
+from functools import partial
+
+
+# ~~~~~~~~~~~ XCOPA ~~~~~~~~~~~ #
+
+# Connector text appended after the premise, selected by the doc's "question" value.
+xcopa_connectors = {"cause": " Izan ere,", "effect": " Beraz,"}
+
+
+def xcopa_doc_to_text(doc):
+    """Return the stripped premise followed by the connector for ``doc["question"]``.
+
+    Raises ``KeyError`` when ``doc["question"]`` is not a key of
+    ``xcopa_connectors``.
+    """
+    # Look the connector up first so a bad question type fails before the
+    # premise is touched.
+    connector = xcopa_connectors[doc["question"]]
+    premise = doc["premise"].strip()
+    return premise + connector
+
+
+def xcopa_doc_to_choice(doc):
+    """Return ``[choice1, choice2]`` with the first character of each lower-cased.
+
+    Only the first character is changed; the rest of each string is kept as is.
+    An empty choice is returned unchanged instead of raising ``IndexError``.
+    """
+
+    def convert_choice(choice):
+        # Slicing rather than indexing keeps this safe for an empty string.
+        return choice[:1].lower() + choice[1:]
+
+    return [convert_choice(doc[key]) for key in ("choice1", "choice2")]
+
+
+# ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ #