Merge pull request #774 from EleutherAI/speedup-hellaswag

[Refactor] Speedup hellaswag context building

Merge pull request #774 from EleutherAI/speedup-hellaswag
[Refactor] Speedup hellaswag context building
4f27f0b9 · Hailey Schoelkopf · GitHub · dbf2c083 · 8189eb18 · 4f27f0b9
Unverified Commit 4f27f0b9 authored Aug 13, 2023 by Hailey Schoelkopf Committed by GitHub Aug 13, 2023
Hide whitespace changes
Inline Side-by-side

Showing with 27 additions and 2 deletions

lm_eval/tasks/hellaswag/hellaswag.yaml lm_eval/tasks/hellaswag/hellaswag.yaml +3 -2

lm_eval/tasks/hellaswag/utils.py lm_eval/tasks/hellaswag/utils.py +24 -0

No files found.
--- a/lm_eval/tasks/hellaswag/hellaswag.yaml
+++ b/lm_eval/tasks/hellaswag/hellaswag.yaml
@@ -7,9 +7,10 @@ output_type: multiple_choice
 training_split: train
 validation_split: validation
 test_split: null
-doc_to_text: "{% set text = activity_label ~ ': ' ~ ctx_a ~ ' ' ~ ctx_b.capitalize() %}{{text|trim|replace(' [title]', '. ')|regex_replace('\\[.*?\\]', '')|replace('  ', ' ')}}"
+process_docs: !function utils.process_docs
+doc_to_text: "{{query}}"
 doc_to_target: "{{label}}"
-doc_to_choice: "{{endings|map('trim')|map('replace', ' [title]', '. ')|map('regex_replace', '\\[.*?\\]', '')|map('replace', '  ', ' ')|list}}"
+doc_to_choice: "{{choices}}"
 metric_list:
  - metric: acc
    aggregation: mean

--- a/lm_eval/tasks/hellaswag/utils.py
+++ b/lm_eval/tasks/hellaswag/utils.py
+import datasets
+import re
+def preprocess(text: str) -> str:
+    """Clean one HellaSwag text field (context or ending).
+
+    Steps, in order:
+      1. Strip leading/trailing whitespace.
+      2. Turn each " [title]" marker into a sentence break (". ").
+      3. Delete every remaining bracketed tag such as "[header]" or "[step]".
+      4. Collapse double spaces in a single left-to-right pass.
+
+    Args:
+        text: Raw string taken from a dataset row.
+
+    Returns:
+        The cleaned string. A leading space can remain when the input began
+        with a bracketed tag, because stripping happens before tag removal.
+    """
+    text = text.strip()
+    # NOTE: Brackets are artifacts of the WikiHow dataset portion of HellaSwag.
+    text = text.replace(" [title]", ". ")
+    # Raw string keeps the pattern readable; non-greedy so each tag is
+    # removed on its own rather than everything between the first "[" and
+    # the last "]".
+    text = re.sub(r"\[.*?\]", "", text)
+    # Deliberately a single pass: a run of three spaces becomes two, not one.
+    # Kept as-is so the generated prompts stay byte-identical.
+    text = text.replace("  ", " ")
+    return text
+def process_docs(dataset: datasets.Dataset) -> datasets.Dataset:
+    """Precompute the prompt fields for every HellaSwag row.
+
+    Each row is passed through ``_process_doc`` via ``dataset.map``. The
+    mapped function returns three fields:
+
+      * ``query``   - "<activity_label>: <ctx_a> <Ctx_b>", cleaned by
+                      ``preprocess``.
+      * ``choices`` - every entry of ``endings``, cleaned by ``preprocess``.
+      * ``gold``    - ``label`` converted to ``int``.
+
+    Args:
+        dataset: Rows providing ``activity_label``, ``ctx_a``, ``ctx_b``,
+            ``endings`` and ``label``.
+
+    Returns:
+        Whatever ``dataset.map`` returns for the per-row function.
+    """
+
+    def _process_doc(doc):
+        # The second context fragment starts a new clause, so capitalize it
+        # before gluing it to the first fragment.
+        context = " ".join([doc["ctx_a"], doc["ctx_b"].capitalize()])
+        prompt = preprocess(doc["activity_label"] + ": " + context)
+        cleaned_endings = list(map(preprocess, doc["endings"]))
+        return {
+            "query": prompt,
+            "choices": cleaned_endings,
+            "gold": int(doc["label"]),
+        }
+
+    return dataset.map(_process_doc)