Add MultipleChoiceTask

706cb53a · Leo Gao · 2a1d7d87 · 706cb53a
Commit 706cb53a authored Feb 04, 2021 by Leo Gao
Hide whitespace changes
Inline Side-by-side

Showing with 29 additions and 0 deletions

lm_eval/base.py lm_eval/base.py +29 -0

No files found.
--- a/lm_eval/base.py
+++ b/lm_eval/base.py
@@ -180,6 +180,35 @@ class Task(abc.ABC):
        return description + labeled_examples + example


+class MultipleChoiceTask(Task):  # Task whose docs carry 'choices' and 'gold'; reports a single metric, "acc".
+    def construct_requests(self, doc, ctx):  # Build one rf.loglikelihood request per entry in doc['choices'].
+        lls = [
+            rf.loglikelihood(ctx, " {}".format(choice))[0]  # continuation is " " + choice; keeps element [0] only
+            for choice in doc['choices']
+        ]
+        # NOTE(review): [0] is presumably the log-likelihood part of what rf.loglikelihood returns — confirm against rf.
+        return lls  # same order as doc['choices']
+
+    def process_results(self, doc, results):  # Turn one doc's per-choice results into {"acc": 1. or 0.}.
+        gold = doc["gold"]
+        # gold is compared with an argmax index, so it is presumably the 0-based position of the correct choice (TODO confirm).
+        acc = 1. if np.argmax(results) == gold else 0.  # np.argmax returns the first maximal index on ties
+        # NOTE(review): np and rf are not imported in this hunk — verify they are already in scope in lm_eval/base.py.
+        return {
+            "acc": acc
+        }
+    
+    def higher_is_better(self):  # Returns {"acc": True}; presumably marks larger acc as better.
+        return {
+            "acc": True
+        }
+    
+    def aggregation(self):  # Maps "acc" to the module-level mean(); presumably applied over per-doc acc values — confirm with caller.
+        return {
+            "acc": mean
+        }
+
+
 def mean(arr):
    return sum(arr) / len(arr)