"src/vscode:/vscode.git/clone" did not exist on "e187629933ea54b310c8cf355cae49b8f4f37430"
Commit f4813cfc authored by lintangsutawika

moved to a new dir

parent dbf2c083
import os
import yaml

from lm_eval import utils
from lm_eval.tasks import register_configurable_task, check_prompt_config
from lm_eval.logger import eval_logger
from lm_eval.api.registry import (
    TASK_REGISTRY,
    GROUP_REGISTRY,
    ALL_TASKS,
)


def include_benchmarks(task_dir):
    # Walk task_dir and register every benchmark YAML found in a leaf directory.
    for root, subdirs, file_list in os.walk(task_dir):
        if (subdirs == [] or subdirs == ["__pycache__"]) and (len(file_list) > 0):
            for f in file_list:
                if f.endswith(".yaml"):
                    try:
                        benchmark_path = os.path.join(root, f)
                        with open(benchmark_path, "rb") as file:
                            yaml_config = yaml.full_load(file)

                        # A benchmark config must name its group and list its tasks.
                        assert "group" in yaml_config
                        group = yaml_config["group"]
                        all_task_list = yaml_config["task"]
                        # Dict entries are inline task configs; string entries refer to
                        # tasks registered elsewhere.
                        config_list = [
                            task for task in all_task_list if type(task) != str
                        ]
                        task_list = [
                            task for task in all_task_list if type(task) == str
                        ]

                        # Register inline task configs under this group.
                        for task_config in config_list:
                            var_configs = check_prompt_config(
                                {
                                    **task_config,
                                    **{"group": group},
                                }
                            )
                            for config in var_configs:
                                register_configurable_task(config)

                        # Attach already-registered tasks to the group.
                        task_names = utils.pattern_match(task_list, ALL_TASKS)
                        for task in task_names:
                            if task in TASK_REGISTRY:
                                if group in GROUP_REGISTRY:
                                    GROUP_REGISTRY[group].append(task)
                                else:
                                    GROUP_REGISTRY[group] = [task]
                                    ALL_TASKS.add(group)

                    except Exception as error:
                        eval_logger.warning(
                            "Failed to load benchmark in\n"
                            f"  {benchmark_path}\n"
                            "  Benchmark will not be added to registry\n"
                            f"  Error: {error}"
                        )


task_dir = os.path.dirname(os.path.abspath(__file__)) + "/"
include_benchmarks(task_dir)
\ No newline at end of file
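For reference, a minimal sketch of the kind of benchmark config this loader consumes, based only on the two keys the code reads ("group" and "task"). The loader walks the directory containing this module, so real configs would sit alongside it as .yaml files; the group name, task names, and inline-config field below are made up for illustration, and the exact fields an inline entry needs are whatever check_prompt_config / register_configurable_task require.

# Illustrative only: a made-up benchmark YAML, embedded as a string so the
# loader's "group"/"task" handling can be shown end to end.
import yaml

sample_yaml = """
group: my_benchmark          # hypothetical group name
task:
  - anli_r1                  # string entry: name of an already-registered task
  - arc_easy
  - task: my_inline_task     # dict entry: an inline task config (other required
                             # fields omitted here)
"""

yaml_config = yaml.full_load(sample_yaml)
assert "group" in yaml_config
group = yaml_config["group"]
# Same split include_benchmarks() performs: dict entries become new task
# configs, string entries are pattern-matched against ALL_TASKS and attached
# to the group.
config_list = [t for t in yaml_config["task"] if not isinstance(t, str)]
task_list = [t for t in yaml_config["task"] if isinstance(t, str)]
print(group, task_list, config_list)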
@@ -11,6 +11,7 @@ import numpy as np
 import lm_eval.api
 import lm_eval.tasks
+import lm_eval.benchmarks
 import lm_eval.models
 import lm_eval.api.metrics
 import lm_eval.api.registry
...
@@ -98,58 +98,58 @@ def include_task_folder(task_dir):
             )


-def include_benchmarks(task_dir, benchmark_dir="benchmarks"):
-    for root, subdirs, file_list in os.walk(os.path.join(task_dir, benchmark_dir)):
-        if (subdirs == [] or subdirs == ["__pycache__"]) and (len(file_list) > 0):
-            for f in file_list:
-                if f.endswith(".yaml"):
-                    try:
-                        benchmark_path = os.path.join(root, f)
-                        with open(benchmark_path, "rb") as file:
-                            yaml_config = yaml.full_load(file)
-                        assert "group" in yaml_config
-                        group = yaml_config["group"]
-                        all_task_list = yaml_config["task"]
-                        config_list = [
-                            task for task in all_task_list if type(task) != str
-                        ]
-                        task_list = [
-                            task for task in all_task_list if type(task) == str
-                        ]
-                        for task_config in config_list:
-                            var_configs = check_prompt_config(
-                                {
-                                    **task_config,
-                                    **{"group": group},
-                                }
-                            )
-                            for config in var_configs:
-                                register_configurable_task(config)
-                        task_names = utils.pattern_match(task_list, ALL_TASKS)
-                        for task in task_names:
-                            if task in TASK_REGISTRY:
-                                if group in GROUP_REGISTRY:
-                                    GROUP_REGISTRY[group].append(task)
-                                else:
-                                    GROUP_REGISTRY[group] = [task]
-                                    ALL_TASKS.add(group)
-                    except Exception as error:
-                        eval_logger.warning(
-                            "Failed to load benchmark in\n"
-                            f"  {benchmark_path}\n"
-                            "  Benchmark will not be added to registry\n"
-                            f"  Error: {error}"
-                        )
+# def include_benchmarks(task_dir, benchmark_dir="benchmarks"):
+#     for root, subdirs, file_list in os.walk(os.path.join(task_dir, benchmark_dir)):
+#         if (subdirs == [] or subdirs == ["__pycache__"]) and (len(file_list) > 0):
+#             for f in file_list:
+#                 if f.endswith(".yaml"):
+#                     try:
+#                         benchmark_path = os.path.join(root, f)
+#                         with open(benchmark_path, "rb") as file:
+#                             yaml_config = yaml.full_load(file)
+#                         assert "group" in yaml_config
+#                         group = yaml_config["group"]
+#                         all_task_list = yaml_config["task"]
+#                         config_list = [
+#                             task for task in all_task_list if type(task) != str
+#                         ]
+#                         task_list = [
+#                             task for task in all_task_list if type(task) == str
+#                         ]
+#                         for task_config in config_list:
+#                             var_configs = check_prompt_config(
+#                                 {
+#                                     **task_config,
+#                                     **{"group": group},
+#                                 }
+#                             )
+#                             for config in var_configs:
+#                                 register_configurable_task(config)
+#                         task_names = utils.pattern_match(task_list, ALL_TASKS)
+#                         for task in task_names:
+#                             if task in TASK_REGISTRY:
+#                                 if group in GROUP_REGISTRY:
+#                                     GROUP_REGISTRY[group].append(task)
+#                                 else:
+#                                     GROUP_REGISTRY[group] = [task]
+#                                     ALL_TASKS.add(group)
+#                     except Exception as error:
+#                         eval_logger.warning(
+#                             "Failed to load benchmark in\n"
+#                             f"  {benchmark_path}\n"
+#                             "  Benchmark will not be added to registry\n"
+#                             f"  Error: {error}"
+#                         )
 task_dir = os.path.dirname(os.path.abspath(__file__)) + "/"
 include_task_folder(task_dir)
-include_benchmarks(task_dir)
+# include_benchmarks(task_dir)

 def get_task(task_name, config):
...
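As a usage sketch (assuming an environment where this commit's lm_eval package is importable): the `import lm_eval.benchmarks` line added in the hunk above is a side-effect import, since the new module calls include_benchmarks() at import time. GROUP_REGISTRY is assumed here to behave like a dict mapping group name to a list of task names, per how the loader fills it in.

# Minimal sketch, not part of the commit: inspect what the side-effect import
# registered.
import lm_eval.benchmarks  # noqa: F401  -- imported only for its registration side effects
from lm_eval.api.registry import ALL_TASKS, GROUP_REGISTRY

for group, tasks in GROUP_REGISTRY.items():
    print(f"{group}: {len(tasks)} task(s)")

# Group names are also added to ALL_TASKS, so they can be selected by name
# the same way individual tasks are.
print(sorted(name for name in ALL_TASKS if name in GROUP_REGISTRY))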