Unverified commit 932e8f9e, authored by Firoj Alam (Scientist, QCRI), committed by GitHub
Browse files

AraDICE task config file (#2507)



* added aradice

* Added ArabicMMLU Lev Configs

* added ArabicMMLU egy configs

* Added boolq configs

* Added cultural bench configs

* added openbookqa configs

* Added PiQA configs

* added winogrande configs

* Added truthfulQA configs

* Added aradice group config

* Remove deleted files from repository

* modified ArabicMMLU configs

* modified metadata versions

* fixed formatting using ruff

* added aradice tasks information

* pre-commit

* Updated openbookqa utils

* fixed formatting on obqa

---------
Co-authored-by: Basel Mousi <bmousi@hbku.edu.qa>
Co-authored-by: Baber <baber@hey.com>
parent b86aa213
"dataset_name": "middle_stem_computer-science"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_stem_egy"
"task": "AraDiCE_ArabicMMLU_middle_stem_computer-science_egy"
"task_alias": "middle stem computer-science"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "middle_stem_natural-science"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_stem_egy"
"task": "AraDiCE_ArabicMMLU_middle_stem_natural-science_egy"
"task_alias": "middle stem natural-science"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "na_humanities_islamic-studies"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_humanities_egy"
"task": "AraDiCE_ArabicMMLU_na_humanities_islamic-studies_egy"
"task_alias": "na humanities islamic-studies"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "na_language_arabic-language-general"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_language_egy"
"task": "AraDiCE_ArabicMMLU_na_language_arabic-language-general_egy"
"task_alias": "na language arabic-language-general"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "na_language_arabic-language-grammar"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_language_egy"
"task": "AraDiCE_ArabicMMLU_na_language_arabic-language-grammar_egy"
"task_alias": "na language arabic-language-grammar"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "na_other_driving-test"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_other_egy"
"task": "AraDiCE_ArabicMMLU_na_other_driving-test_egy"
"task_alias": "na other driving-test"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "na_other_general-knowledge"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_other_egy"
"task": "AraDiCE_ArabicMMLU_na_other_general-knowledge_egy"
"task_alias": "na other general-knowledge"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "primary_humanities_history"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_humanities_egy"
"task": "AraDiCE_ArabicMMLU_primary_humanities_history_egy"
"task_alias": "primary humanities history"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "primary_humanities_islamic-studies"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_humanities_egy"
"task": "AraDiCE_ArabicMMLU_primary_humanities_islamic-studies_egy"
"task_alias": "primary humanities islamic-studies"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "primary_language_arabic-language"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_language_egy"
"task": "AraDiCE_ArabicMMLU_primary_language_arabic-language_egy"
"task_alias": "primary language arabic-language"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "primary_other_general-knowledge"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_other_egy"
"task": "AraDiCE_ArabicMMLU_primary_other_general-knowledge_egy"
"task_alias": "primary other general-knowledge"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "primary_social-science_geography"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_social-science_egy"
"task": "AraDiCE_ArabicMMLU_primary_social-science_geography_egy"
"task_alias": "primary social-science geography"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "primary_social-science_social-science"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_social-science_egy"
"task": "AraDiCE_ArabicMMLU_primary_social-science_social-science_egy"
"task_alias": "primary social-science social-science"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "primary_stem_computer-science"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_stem_egy"
"task": "AraDiCE_ArabicMMLU_primary_stem_computer-science_egy"
"task_alias": "primary stem computer-science"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "primary_stem_math"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_stem_egy"
"task": "AraDiCE_ArabicMMLU_primary_stem_math_egy"
"task_alias": "primary stem math"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "primary_stem_natural-science"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_stem_egy"
"task": "AraDiCE_ArabicMMLU_primary_stem_natural-science_egy"
"task_alias": "primary stem natural-science"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "prof_humanities_law"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_humanities_egy"
"task": "AraDiCE_ArabicMMLU_prof_humanities_law_egy"
"task_alias": "prof humanities law"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "univ_other_management"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_other_egy"
"task": "AraDiCE_ArabicMMLU_univ_other_management_egy"
"task_alias": "univ other management"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "univ_social-science_accounting"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_social-science_egy"
"task": "AraDiCE_ArabicMMLU_univ_social-science_accounting_egy"
"task_alias": "univ social-science accounting"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
"dataset_name": "univ_social-science_economics"
"description": ""
"fewshot_split": !!null "null"
"include": "_default_template_yaml"
"tag": "AraDiCE_ArabicMMLU_social-science_egy"
"task": "AraDiCE_ArabicMMLU_univ_social-science_economics_egy"
"task_alias": "univ social-science economics"
"test_split": "test"
"training_split": !!null "null"
"validation_split": !!null "null"
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment