Unverified commit 3816796e, authored by Alexandre Marques and committed by GitHub
Browse files

Adds MMLU CoT, gsm8k and arc_challenge for llama instruct (#2829)

* llama-style MMLU CoT

* Refactor MMLU CoT template YAML to simplify 'until' structure

* Add GSM8K task configuration for LLaMA3 with few-shot examples

* Fix missing newline at end of MMLU CoT YAML file

* Add ARC-Challenge task configuration and processing utility

* Add additional MMLU and ARC-Challenge task variants to README

* Update README with notes on arc_challenge_llama dataset preprocessing
parent 1514ac1e
"dataset_name": "college_physics"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_stem_tasks"
"task": "mmlu_cot_llama_college_physics"
"task_alias": "college physics"
"dataset_name": "computer_security"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_stem_tasks"
"task": "mmlu_cot_llama_computer_security"
"task_alias": "computer security"
"dataset_name": "conceptual_physics"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_stem_tasks"
"task": "mmlu_cot_llama_conceptual_physics"
"task_alias": "conceptual physics"
"dataset_name": "econometrics"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_social_sciences_tasks"
"task": "mmlu_cot_llama_econometrics"
"task_alias": "econometrics"
"dataset_name": "electrical_engineering"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_stem_tasks"
"task": "mmlu_cot_llama_electrical_engineering"
"task_alias": "electrical engineering"
"dataset_name": "elementary_mathematics"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_stem_tasks"
"task": "mmlu_cot_llama_elementary_mathematics"
"task_alias": "elementary mathematics"
"dataset_name": "formal_logic"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_humanities_tasks"
"task": "mmlu_cot_llama_formal_logic"
"task_alias": "formal logic"
"dataset_name": "global_facts"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_other_tasks"
"task": "mmlu_cot_llama_global_facts"
"task_alias": "global facts"
"dataset_name": "high_school_biology"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_stem_tasks"
"task": "mmlu_cot_llama_high_school_biology"
"task_alias": "high school biology"
"dataset_name": "high_school_chemistry"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_stem_tasks"
"task": "mmlu_cot_llama_high_school_chemistry"
"task_alias": "high school chemistry"
"dataset_name": "high_school_computer_science"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_stem_tasks"
"task": "mmlu_cot_llama_high_school_computer_science"
"task_alias": "high school computer science"
"dataset_name": "high_school_european_history"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_humanities_tasks"
"task": "mmlu_cot_llama_high_school_european_history"
"task_alias": "high school european history"
"dataset_name": "high_school_geography"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_social_sciences_tasks"
"task": "mmlu_cot_llama_high_school_geography"
"task_alias": "high school geography"
"dataset_name": "high_school_government_and_politics"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_social_sciences_tasks"
"task": "mmlu_cot_llama_high_school_government_and_politics"
"task_alias": "high school government and politics"
"dataset_name": "high_school_macroeconomics"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_social_sciences_tasks"
"task": "mmlu_cot_llama_high_school_macroeconomics"
"task_alias": "high school macroeconomics"
"dataset_name": "high_school_mathematics"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_stem_tasks"
"task": "mmlu_cot_llama_high_school_mathematics"
"task_alias": "high school mathematics"
"dataset_name": "high_school_microeconomics"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_social_sciences_tasks"
"task": "mmlu_cot_llama_high_school_microeconomics"
"task_alias": "high school microeconomics"
"dataset_name": "high_school_physics"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_stem_tasks"
"task": "mmlu_cot_llama_high_school_physics"
"task_alias": "high school physics"
"dataset_name": "high_school_psychology"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_social_sciences_tasks"
"task": "mmlu_cot_llama_high_school_psychology"
"task_alias": "high school psychology"
"dataset_name": "high_school_statistics"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_stem_tasks"
"task": "mmlu_cot_llama_high_school_statistics"
"task_alias": "high school statistics"
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment