Unverified commit 9822b06e, authored by Lintang Sutawika, committed by GitHub
Browse files

Merge branch 'main' into weight_by_size

parents 51f27158 b177c82c
# KMMLU "hard" per-subject task stanzas.
#
# Every stanza sets the same three keys (dataset_name, include, task). Each
# stanza is therefore its own YAML document, introduced by `---`: inside one
# mapping the repeated keys would be duplicates, and most parsers would
# silently keep only the last stanza.
#
# NOTE(review): `include` presumably pulls shared settings from
# `_hard_kmmlu_yaml`; that behaviour belongs to the consuming tool - confirm.
# NOTE(review): if these stanzas are meant to live in one file per subject,
# split this stream on the `---` markers; a multi-document stream must be read
# with a multi-document loader.
---
dataset_name: food_processing
include: _hard_kmmlu_yaml
task: kmmlu_hard_food_processing
---
dataset_name: gas_technology_and_engineering
include: _hard_kmmlu_yaml
task: kmmlu_hard_gas_technology_and_engineering
---
dataset_name: geomatics
include: _hard_kmmlu_yaml
task: kmmlu_hard_geomatics
---
dataset_name: health
include: _hard_kmmlu_yaml
task: kmmlu_hard_health
---
dataset_name: industrial_engineer
include: _hard_kmmlu_yaml
task: kmmlu_hard_industrial_engineer
---
dataset_name: information_technology
include: _hard_kmmlu_yaml
task: kmmlu_hard_information_technology
---
dataset_name: interior_architecture_and_design
include: _hard_kmmlu_yaml
task: kmmlu_hard_interior_architecture_and_design
---
dataset_name: korean_history
include: _hard_kmmlu_yaml
task: kmmlu_hard_korean_history
---
dataset_name: law
include: _hard_kmmlu_yaml
task: kmmlu_hard_law
---
dataset_name: machine_design_and_manufacturing
include: _hard_kmmlu_yaml
task: kmmlu_hard_machine_design_and_manufacturing
---
dataset_name: management
include: _hard_kmmlu_yaml
task: kmmlu_hard_management
---
dataset_name: maritime_engineering
include: _hard_kmmlu_yaml
task: kmmlu_hard_maritime_engineering
---
dataset_name: marketing
include: _hard_kmmlu_yaml
task: kmmlu_hard_marketing
---
dataset_name: materials_engineering
include: _hard_kmmlu_yaml
task: kmmlu_hard_materials_engineering
---
dataset_name: math
include: _hard_kmmlu_yaml
task: kmmlu_hard_math
---
dataset_name: mechanical_engineering
include: _hard_kmmlu_yaml
task: kmmlu_hard_mechanical_engineering
---
dataset_name: nondestructive_testing
include: _hard_kmmlu_yaml
task: kmmlu_hard_nondestructive_testing
---
dataset_name: patent
include: _hard_kmmlu_yaml
task: kmmlu_hard_patent
---
dataset_name: political_science_and_sociology
include: _hard_kmmlu_yaml
task: kmmlu_hard_political_science_and_sociology
---
dataset_name: psychology
include: _hard_kmmlu_yaml
task: kmmlu_hard_psychology
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment