Unverified commit 3816796e, authored by Alexandre Marques, committed by GitHub
Browse files

Adds MMLU CoT, gsm8k and arc_challenge for llama instruct (#2829)

* llama-style MMLU CoT

* Refactor MMLU CoT template YAML to simplify 'until' structure

* Add GSM8K task configuration for LLaMA3 with few-shot examples

* Fix missing newline at end of MMLU CoT YAML file

* Add ARC-Challenge task configuration and processing utility

* Add additional MMLU and ARC-Challenge task variants to README

* Update README with notes on arc_challenge_llama dataset preprocessing
parent 1514ac1e
"dataset_name": "high_school_us_history"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_humanities_tasks"
"task": "mmlu_cot_llama_high_school_us_history"
"task_alias": "high school us history"
"dataset_name": "high_school_world_history"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_humanities_tasks"
"task": "mmlu_cot_llama_high_school_world_history"
"task_alias": "high school world history"
"dataset_name": "human_aging"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_other_tasks"
"task": "mmlu_cot_llama_human_aging"
"task_alias": "human aging"
"dataset_name": "human_sexuality"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_social_sciences_tasks"
"task": "mmlu_cot_llama_human_sexuality"
"task_alias": "human sexuality"
"dataset_name": "international_law"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_humanities_tasks"
"task": "mmlu_cot_llama_international_law"
"task_alias": "international law"
"dataset_name": "jurisprudence"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_humanities_tasks"
"task": "mmlu_cot_llama_jurisprudence"
"task_alias": "jurisprudence"
"dataset_name": "logical_fallacies"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_humanities_tasks"
"task": "mmlu_cot_llama_logical_fallacies"
"task_alias": "logical fallacies"
"dataset_name": "machine_learning"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_stem_tasks"
"task": "mmlu_cot_llama_machine_learning"
"task_alias": "machine learning"
"dataset_name": "management"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_other_tasks"
"task": "mmlu_cot_llama_management"
"task_alias": "management"
"dataset_name": "marketing"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_other_tasks"
"task": "mmlu_cot_llama_marketing"
"task_alias": "marketing"
"dataset_name": "medical_genetics"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_other_tasks"
"task": "mmlu_cot_llama_medical_genetics"
"task_alias": "medical genetics"
"dataset_name": "miscellaneous"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_other_tasks"
"task": "mmlu_cot_llama_miscellaneous"
"task_alias": "miscellaneous"
"dataset_name": "moral_disputes"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_humanities_tasks"
"task": "mmlu_cot_llama_moral_disputes"
"task_alias": "moral disputes"
"dataset_name": "moral_scenarios"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_humanities_tasks"
"task": "mmlu_cot_llama_moral_scenarios"
"task_alias": "moral scenarios"
"dataset_name": "nutrition"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_other_tasks"
"task": "mmlu_cot_llama_nutrition"
"task_alias": "nutrition"
"dataset_name": "philosophy"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_humanities_tasks"
"task": "mmlu_cot_llama_philosophy"
"task_alias": "philosophy"
"dataset_name": "prehistory"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_humanities_tasks"
"task": "mmlu_cot_llama_prehistory"
"task_alias": "prehistory"
"dataset_name": "professional_accounting"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_other_tasks"
"task": "mmlu_cot_llama_professional_accounting"
"task_alias": "professional accounting"
"dataset_name": "professional_law"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_humanities_tasks"
"task": "mmlu_cot_llama_professional_law"
"task_alias": "professional law"
"dataset_name": "professional_medicine"
"description": ""
"include": "_mmlu_cot_llama_template_yaml"
"tag": "mmlu_cot_llama_other_tasks"
"task": "mmlu_cot_llama_professional_medicine"
"task_alias": "professional medicine"
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment