Remove the winograd_schema task type fully

2bd45fd9 · haileyschoelkopf · 80358e5a · 2bd45fd9 · 2bd45fd9
Commit 2bd45fd9 authored Jul 18, 2023 by haileyschoelkopf
Hide whitespace changes
Inline Side-by-side

Showing 2 changed files with 1 addition and 5 deletions

lm_eval/api/registry.py +0 -1

lm_eval/evaluator.py +1 -4

No files found.
--- a/lm_eval/api/registry.py
+++ b/lm_eval/api/registry.py
@@ -80,7 +80,6 @@ DEFAULT_METRIC_REGISTRY = {
    ],
    "loglikelihood_rolling": ["word_perplexity", "byte_perplexity", "bits_per_byte"],
    "multiple_choice": ["acc", "acc_norm"],
-    "winograd_schema": ["acc"],
    "greedy_until": ["exact_match"],
 }


--- a/lm_eval/evaluator.py
+++ b/lm_eval/evaluator.py
@@ -223,10 +223,7 @@ def evaluate(
        # aggregate Instances by LM method requested to get output.
        reqtype = (
            "loglikelihood"
-            if (
-                task.OUTPUT_TYPE == "multiple_choice"
-                or task.OUTPUT_TYPE == "winograd_schema"
-            )
+            if task.OUTPUT_TYPE == "multiple_choice"
            else task.OUTPUT_TYPE
        )  # TODO: this is hacky, fix in task.py
        requests[reqtype].extend(task.instances)