test

2a67a469 · baberabb · acf73a04 · 2a67a469 · 2a67a469 · 2a67a469
Commit 2a67a469 authored Dec 28, 2023 by baberabb
Showing with 36 additions and 4 deletions

lm_eval/tasks/arc/arc_challenge.yaml lm_eval/tasks/arc/arc_challenge.yaml +0 -1

lm_eval/tasks/arc/arc_easy.yaml lm_eval/tasks/arc/arc_easy.yaml +0 -1

scripts/make_table_tasks.py scripts/make_table_tasks.py +36 -2

No files found.
--- a/lm_eval/tasks/arc/arc_challenge.yaml
+++ b/lm_eval/tasks/arc/arc_challenge.yaml
 include: arc_easy.yaml
 task: arc_challenge
-# test
 dataset_name: ARC-Challenge
--- a/lm_eval/tasks/arc/arc_easy.yaml
+++ b/lm_eval/tasks/arc/arc_easy.yaml
@@ -3,7 +3,6 @@ group:
 task: arc_easy
 dataset_path: ai2_arc
 dataset_name: ARC-Easy
-# test
 output_type: multiple_choice
 training_split: train
 validation_split: validation

--- a/scripts/make_table_tasks.py
+++ b/scripts/make_table_tasks.py
@@ -3,15 +3,16 @@ Usage:
   Writes csv and Markdown table to csv_file, md_file (below).
 """
 import logging
+import os
 from pathlib import Path
+from typing import List, Union
 import datasets
 import pandas as pd
 from lm_eval import tasks
 from lm_eval.tasks import TASK_REGISTRY
+from lm_eval.utils import load_yaml_config
-from ..tests.utils import new_tasks
 logging.basicConfig(level=logging.INFO)
@@ -20,6 +21,39 @@ datasets.disable_caching()
 tasks.initialize_tasks()
+def load_changed_files(file_path: str) -> List[str]:
+    """Read ``file_path`` and return its contents split on whitespace.
+
+    Args:
+        file_path: Path of the text file to read.
+
+    Returns:
+        Every whitespace-separated token of the file, in file order.
+        Presumably each token is the path of a changed file written by CI;
+        confirm against whatever produces the file.
+    """
+    with open(file_path, "r") as f:
+        content = f.read()
+        # split() with no argument breaks on any run of whitespace (spaces
+        # and newlines alike) and never yields empty strings.
+        words_list = [x for x in content.split()]
+    return words_list
+def parser(full_path: List[str]) -> List[str]:
+    """Collect the ``"task"`` values of the YAML configs named by ``full_path``.
+
+    Args:
+        full_path: File paths to inspect. Entries that end in neither
+            ``.yaml`` nor ``.py`` are ignored.
+
+    Returns:
+        The distinct ``"task"`` values found. They are gathered in a set, so
+        duplicates are dropped and the order of the list is not defined.
+    """
+    _output = set()
+    for x in full_path:
+        if x.endswith(".yaml"):
+            # NOTE(review): the ["task"] lookup assumes every loaded config
+            # exposes a "task" key; confirm for configs that may lack one.
+            _output.add(load_yaml_config(x)["task"])
+        elif x.endswith(".py"):
+            # A changed .py file stands in for every YAML file that sits
+            # directly in the same directory (glob("*.yaml") does not recurse).
+            path = [str(x) for x in (list(Path(x).parent.glob("*.yaml")))]
+            # The comprehension's x is local to the comprehension; it does
+            # not rebind the loop variable of the enclosing for.
+            _output |= {load_yaml_config(x)["task"] for x in path}
+    return list(_output)
+def new_tasks() -> Union[List[str], None]:
+    """Pick task names from a changed-files list or the ``API`` env variable.
+
+    Returns:
+        The result of ``parser`` over the tokens of ``FILENAME`` when that
+        file exists; otherwise a fixed list of four task names when the
+        ``API`` environment variable is set; otherwise ``None``.
+    """
+    FILENAME = ".github/outputs/tasks_all_changed_and_modified_files.txt"
+    if os.path.exists(FILENAME):
+        # If tasks folder has changed then we get the list of files from FILENAME
+        # and parse the yaml files to get the task names.
+        return parser(load_changed_files(FILENAME))
+    elif os.getenv("API") is not None:
+        # Or, if the API has changed, the ENV variable API is expected to be
+        # set. Only its presence is checked here, so any value (even an
+        # empty string) selects this fixed list of tasks.
+        return ["arc_easy", "hellaswag", "piqa", "wikitext"]
+    # Neither condition holds: return None. NOTE(review): this comment used
+    # to read "just do arc_easy"; presumably the caller substitutes that
+    # default when it receives None. Confirm at the call site.
+    else:
+        return None
 def check(tf):
    if tf:
        return "✓"