Unverified commit 9822b06e, authored by Lintang Sutawika and committed by GitHub
Browse files

Merge branch 'main' into weight_by_size

parents 51f27158 b177c82c
---
# Task entry: kmmlu_hard_direct_telecommunications_and_wireless_technology.
# The explicit document markers keep this three-key mapping separate from the
# page text above it and from the settings that follow it.
# NOTE(review): `include` names `_direct_hard_kmmlu_yaml`; presumably the
# consuming harness resolves it relative to this config — confirm.
dataset_name: telecommunications_and_wireless_technology
include: _direct_hard_kmmlu_yaml
task: kmmlu_hard_direct_telecommunications_and_wireless_technology
---
# Shared KMMLU-hard task settings, as captured from a rendered diff view.
# NOTE(review): several keys below occur twice with different values. This
# looks like the removed and added sides of a diff printed without +/- markers
# (presumably old value first, new value second) — confirm against the
# repository before use. Most YAML parsers silently keep the last occurrence.
# NOTE(review): nesting indentation appears to have been lost in capture; the
# lines after `metric_list:` and `metadata:` are presumably their children.
# Duplicate key `group` (1 of 2): scalar form.
group: kmmlu
# Duplicate key `dataset_path` (1 of 2).
dataset_path: HAERAE-HUB/K-MMLU-Preview
# Duplicate key `group` (2 of 2): list form.
group:
- kmmlu
- kmmlu_hard
# Duplicate key `dataset_path` (2 of 2).
dataset_path: HAERAE-HUB/KMMLU-HARD
# Duplicate key `output_type` (1 of 2): repeated below with the same value.
output_type: multiple_choice
training_split: train
validation_split: dev
test_split: test
fewshot_split: dev
# Duplicate key `output_type` (2 of 2).
output_type: multiple_choice
# Prompt template: the stripped question, options A-D on separate lines, then
# the Korean cue "정답:" ("Answer:").
doc_to_text: "{{question.strip()}}\nA. {{A}}\nB. {{B}}\nC. {{C}}\nD. {{D}}\n정답:"
doc_to_choice: ["A", "B", "C", "D"]
# Duplicate key `doc_to_target` (1 of 2): renders the letter found at
# position `answer-1` of the A-D list.
doc_to_target: "{{['A', 'B', 'C', 'D'][answer-1]}}"
# Duplicate key `doc_to_target` (2 of 2): renders the number `answer-1`.
doc_to_target: "{{answer-1}}"
metric_list:
- metric: acc
aggregation: mean
# NOTE(review): the next line is a diff hunk header, not YAML. It presumably
# marks a point where lines were elided from the capture, so the
# `aggregation` / `higher_is_better` pair after it may belong to a metric
# entry whose `- metric:` line is not shown — restore from the repository.
......@@ -17,4 +16,4 @@ metric_list:
aggregation: mean
higher_is_better: true
metadata:
# Duplicate key `version` (1 of 2).
version: 1.1
# Duplicate key `version` (2 of 2).
version: 2.0
# KMMLU-hard per-subject task entries (accounting … fashion).
# Each entry is its own YAML document: the same three keys recur in every
# entry, so without the `---` markers they would collide as duplicate keys in
# one mapping and a last-wins parser would keep only the final entry.
# NOTE(review): every entry names `_hard_kmmlu_yaml` under `include`;
# presumably the consuming harness merges that template — confirm.
---
# Subject: accounting
dataset_name: accounting
include: _hard_kmmlu_yaml
task: kmmlu_hard_accounting
---
# Subject: agricultural_sciences
dataset_name: agricultural_sciences
include: _hard_kmmlu_yaml
task: kmmlu_hard_agricultural_sciences
---
# Subject: aviation_engineering_and_maintenance
dataset_name: aviation_engineering_and_maintenance
include: _hard_kmmlu_yaml
task: kmmlu_hard_aviation_engineering_and_maintenance
---
# Subject: biology
dataset_name: biology
include: _hard_kmmlu_yaml
task: kmmlu_hard_biology
---
# Subject: chemical_engineering
dataset_name: chemical_engineering
include: _hard_kmmlu_yaml
task: kmmlu_hard_chemical_engineering
---
# Subject: chemistry
dataset_name: chemistry
include: _hard_kmmlu_yaml
task: kmmlu_hard_chemistry
---
# Subject: civil_engineering
dataset_name: civil_engineering
include: _hard_kmmlu_yaml
task: kmmlu_hard_civil_engineering
---
# Subject: computer_science
dataset_name: computer_science
include: _hard_kmmlu_yaml
task: kmmlu_hard_computer_science
---
# Subject: construction
dataset_name: construction
include: _hard_kmmlu_yaml
task: kmmlu_hard_construction
---
# Subject: criminal_law
dataset_name: criminal_law
include: _hard_kmmlu_yaml
task: kmmlu_hard_criminal_law
---
# Subject: ecology
dataset_name: ecology
include: _hard_kmmlu_yaml
task: kmmlu_hard_ecology
---
# Subject: economics
dataset_name: economics
include: _hard_kmmlu_yaml
task: kmmlu_hard_economics
---
# Subject: education
dataset_name: education
include: _hard_kmmlu_yaml
task: kmmlu_hard_education
---
# Subject: electrical_engineering
dataset_name: electrical_engineering
include: _hard_kmmlu_yaml
task: kmmlu_hard_electrical_engineering
---
# Subject: electronics_engineering
dataset_name: electronics_engineering
include: _hard_kmmlu_yaml
task: kmmlu_hard_electronics_engineering
---
# Subject: energy_management
dataset_name: energy_management
include: _hard_kmmlu_yaml
task: kmmlu_hard_energy_management
---
# Subject: environmental_science
dataset_name: environmental_science
include: _hard_kmmlu_yaml
task: kmmlu_hard_environmental_science
---
# Subject: fashion
dataset_name: fashion
include: _hard_kmmlu_yaml
task: kmmlu_hard_fashion
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment