Unverified Commit 7cd004c4 authored by Zehan Li's avatar Zehan Li Committed by GitHub
Browse files

add multilingual mmlu eval (#1484)

parent 5ccd65d4
......@@ -6,17 +6,7 @@ from tqdm import tqdm
def main() -> None:
dataset_path = "alexandrainst/m_mmlu"
# The hy and sk subdatasets were removed because the original dataset is broken.
# I opened this PR on the dataset for the authors:
# https://huggingface.co/datasets/alexandrainst/m_mmlu/discussions/3
# If it is accepted, the filter can be removed.
keys_without_hy_sk = list( # noqa: F841
filter(
lambda k: ("hy" not in k and "sk" not in k),
datasets.get_dataset_infos(dataset_path).keys(),
)
)
for task in tqdm():
for task in tqdm(datasets.get_dataset_infos(dataset_path).keys()):
file_name = f"m_mmlu_{task}.yaml"
try:
with open(f"{file_name}", "w") as f:
......
# Generated by _generate_configs.py
dataset_name: hy
include: _default_yaml
task: m_mmlu_hy
# Generated by _generate_configs.py
dataset_name: sk
include: _default_yaml
task: m_mmlu_sk
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment