Unverified commit ded890f3, authored by Jinho Heo and committed by GitHub
Browse files

Add kmmlu multiple-choice(accuracy) task (#2849)

parent febd19d8
# KMMLU task config for the Mechanical-Engineering subject.
# Task name and the tag it is filed under (STEM tasks).
task: kmmlu_mechanical_engineering
tag: kmmlu_stem_tasks
# Subject name selecting the data; presumably a dataset subset name —
# confirm against the included base file.
dataset_name: Mechanical-Engineering
# Base config this file includes (its contents are not visible here).
include: _default_kmmlu_yaml
# KMMLU task config for the Nondestructive-Testing subject.
# Task name and the tag it is filed under (applied-science tasks).
task: kmmlu_nondestructive_testing
tag: kmmlu_applied_science_tasks
# Subject name selecting the data; presumably a dataset subset name —
# confirm against the included base file.
dataset_name: Nondestructive-Testing
# Base config this file includes (its contents are not visible here).
include: _default_kmmlu_yaml
# KMMLU task config for the Patent subject.
# Task name and the tag it is filed under ("other" tasks).
task: kmmlu_patent
tag: kmmlu_other_tasks
# Subject name selecting the data; presumably a dataset subset name —
# confirm against the included base file.
dataset_name: Patent
# Base config this file includes (its contents are not visible here).
include: _default_kmmlu_yaml
# KMMLU task config for the Political-Science-and-Sociology subject.
# Task name and the tag it is filed under (HUMSS tasks).
task: kmmlu_political_science_and_sociology
tag: kmmlu_humss_tasks
# Subject name selecting the data; presumably a dataset subset name —
# confirm against the included base file.
dataset_name: Political-Science-and-Sociology
# Base config this file includes (its contents are not visible here).
include: _default_kmmlu_yaml
# KMMLU task config for the Psychology subject.
# Task name and the tag it is filed under (HUMSS tasks).
task: kmmlu_psychology
tag: kmmlu_humss_tasks
# Subject name selecting the data; presumably a dataset subset name —
# confirm against the included base file.
dataset_name: Psychology
# Base config this file includes (its contents are not visible here).
include: _default_kmmlu_yaml
# KMMLU task config for the Public-Safety subject.
# Task name and the tag it is filed under ("other" tasks).
task: kmmlu_public_safety
tag: kmmlu_other_tasks
# Subject name selecting the data; presumably a dataset subset name —
# confirm against the included base file.
dataset_name: Public-Safety
# Base config this file includes (its contents are not visible here).
include: _default_kmmlu_yaml
# KMMLU task config for the Railway-and-Automotive-Engineering subject.
# Task name and the tag it is filed under (applied-science tasks).
task: kmmlu_railway_and_automotive_engineering
tag: kmmlu_applied_science_tasks
# Subject name selecting the data; presumably a dataset subset name —
# confirm against the included base file.
dataset_name: Railway-and-Automotive-Engineering
# Base config this file includes (its contents are not visible here).
include: _default_kmmlu_yaml
# KMMLU task config for the Real-Estate subject.
# Task name and the tag it is filed under ("other" tasks).
task: kmmlu_real_estate
tag: kmmlu_other_tasks
# Subject name selecting the data; presumably a dataset subset name —
# confirm against the included base file.
dataset_name: Real-Estate
# Base config this file includes (its contents are not visible here).
include: _default_kmmlu_yaml
# KMMLU task config for the Refrigerating-Machinery subject.
# Task name and the tag it is filed under ("other" tasks).
task: kmmlu_refrigerating_machinery
tag: kmmlu_other_tasks
# Subject name selecting the data; presumably a dataset subset name —
# confirm against the included base file.
dataset_name: Refrigerating-Machinery
# Base config this file includes (its contents are not visible here).
include: _default_kmmlu_yaml
# KMMLU task config for the Social-Welfare subject.
# Task name and the tag it is filed under (HUMSS tasks).
task: kmmlu_social_welfare
tag: kmmlu_humss_tasks
# Subject name selecting the data; presumably a dataset subset name —
# confirm against the included base file.
dataset_name: Social-Welfare
# Base config this file includes (its contents are not visible here).
include: _default_kmmlu_yaml
# KMMLU task config for the Taxation subject.
# Task name and the tag it is filed under (HUMSS tasks).
task: kmmlu_taxation
tag: kmmlu_humss_tasks
# Subject name selecting the data; presumably a dataset subset name —
# confirm against the included base file.
dataset_name: Taxation
# Base config this file includes (its contents are not visible here).
include: _default_kmmlu_yaml
# KMMLU task config for the Telecommunications-and-Wireless-Technology
# subject.
# Task name and the tag it is filed under (applied-science tasks).
task: kmmlu_telecommunications_and_wireless_technology
tag: kmmlu_applied_science_tasks
# Subject name selecting the data; presumably a dataset subset name —
# confirm against the included base file.
dataset_name: Telecommunications-and-Wireless-Technology
# Base config this file includes (its contents are not visible here).
include: _default_kmmlu_yaml
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment