Unverified commit 4bb92ebc, authored by Jess and committed by GitHub
Browse files

Merge pull request #18 from JessicaOjo/africamgsm

fix exact match bug and restructure mmlu folder
parents 348e304a 5ba791e2
......@@ -1367,6 +1367,13 @@ class ConfigurableTask(Task):
result_score = 0.0
else:
try:
if metric == "exact_match":
result_score = self._metric_fn_list[metric](
references=[str(gold)],
predictions=[str(result)],
**self._metric_fn_kwargs[metric],
)
else:
result_score = self._metric_fn_list[metric](
references=[gold],
predictions=[result],
......
......@@ -4,7 +4,7 @@ models=(
"gpt-3.5-turbo"
"gpt-4-0125-preview"
)
task=afrimgsm_direct_eng,afrimgsm_direct_fra,afrimgsm_direct_swa #afrimgsm_direct_ewe,afrimgsm_direct_fra,afrimgsm_direct_hau,afrimgsm_direct_ibo,afrimgsm_direct_kin,afrimgsm_direct_lin,afrimgsm_direct_lug,afrimgsm_direct_orm,afrimgsm_direct_sna,afrimgsm_direct_sot,afrimgsm_direct_swa,afrimgsm_direct_twi,afrimgsm_direct_wol,afrimgsm_direct_xho,afrimgsm_direct_yor,afrimgsm_direct_zul
task=afrimgsm_direct_amh,afrimgsm_direct_eng,afrimgsm_direct_ewe,afrimgsm_direct_fra,afrimgsm_direct_hau,afrimgsm_direct_ibo,afrimgsm_direct_kin,afrimgsm_direct_lin,afrimgsm_direct_lug,afrimgsm_direct_orm,afrimgsm_direct_sna,afrimgsm_direct_sot,afrimgsm_direct_swa,afrimgsm_direct_twi,afrimgsm_direct_wol,afrimgsm_direct_xho,afrimgsm_direct_yor,afrimgsm_direct_zul
for model in "${models[@]}"
do
......
dataset_name: amh
include: afrimmlu_common_yaml
task: afrimmlu_amh
task: afrimmlu_direct_amh
dataset_name: eng
include: afrimmlu_common_yaml
task: afrimmlu_eng
task: afrimmlu_direct_eng
dataset_name: ewe
include: afrimmlu_common_yaml
task: afrimmlu_ewe
task: afrimmlu_direct_ewe
dataset_name: fra
include: afrimmlu_common_yaml
task: afrimmlu_fra
\ No newline at end of file
task: afrimmlu_direct_fra
\ No newline at end of file
dataset_name: hau
include: afrimmlu_common_yaml
task: afrimmlu_hau
\ No newline at end of file
task: afrimmlu_direct_hau
\ No newline at end of file
dataset_name: ibo
include: afrimmlu_common_yaml
task: afrimmlu_ibo
\ No newline at end of file
task: afrimmlu_direct_ibo
\ No newline at end of file
dataset_name: kin
include: afrimmlu_common_yaml
task: afrimmlu_kin
\ No newline at end of file
task: afrimmlu_direct_kin
\ No newline at end of file
dataset_name: lin
include: afrimmlu_common_yaml
task: afrimmlu_lin
\ No newline at end of file
task: afrimmlu_direct_lin
\ No newline at end of file
dataset_name: lug
include: afrimmlu_common_yaml
task: afrimmlu_lug
\ No newline at end of file
task: afrimmlu_direct_lug
\ No newline at end of file
dataset_name: orm
include: afrimmlu_common_yaml
task: afrimmlu_orm
\ No newline at end of file
task: afrimmlu_direct_orm
\ No newline at end of file
dataset_name: sna
include: afrimmlu_common_yaml
task: afrimmlu_sna
\ No newline at end of file
task: afrimmlu_direct_sna
\ No newline at end of file
dataset_name: sot
include: afrimmlu_common_yaml
task: afrimmlu_sot
\ No newline at end of file
task: afrimmlu_direct_sot
\ No newline at end of file
dataset_name: swa
include: afrimmlu_common_yaml
task: afrimmlu_swa
\ No newline at end of file
task: afrimmlu_direct_swa
\ No newline at end of file
dataset_name: twi
include: afrimmlu_common_yaml
task: afrimmlu_twi
\ No newline at end of file
task: afrimmlu_direct_twi
\ No newline at end of file
dataset_name: wol
include: afrimmlu_common_yaml
task: afrimmlu_wol
\ No newline at end of file
task: afrimmlu_direct_wol
\ No newline at end of file
dataset_name: xho
include: afrimmlu_common_yaml
task: afrimmlu_xho
\ No newline at end of file
task: afrimmlu_direct_xho
\ No newline at end of file
dataset_name: yor
include: afrimmlu_common_yaml
task: afrimmlu_yor
\ No newline at end of file
task: afrimmlu_direct_yor
\ No newline at end of file
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment