Fix

96157fc7 · Leo Gao · c3f724cf · 96157fc7 · 96157fc7 · 96157fc7
Commit 96157fc7 authored Feb 08, 2021 by Leo Gao
Hide whitespace changes
Inline Side-by-side

Showing 3 changed files with 14 additions and 13 deletions

lm_eval/tasks/glue.py +11 -11

lm_eval/tasks/superglue.py +2 -1

lm_eval/utils.py +1 -1

No files found.
--- a/lm_eval/tasks/glue.py
+++ b/lm_eval/tasks/glue.py
@@ -68,19 +68,19 @@ class SST(HFTask):
        return True

    def fewshot_description(self):
-        return "Indicate if each sentence is Positive or Negative."
+        return "Indicate if the sentiment of each sentence is positive or negative."

    def doc_to_text(self, doc):
-        return "{}\nQuestion: Is this sentence Positive or Negative?\nAnswer:".format(
+        return "{}\nQuestion: Is this sentence positive or negative?\nAnswer:".format(
            general_detokenize(doc["sentence"]),
        )

    def doc_to_target(self, doc):
-        return " {}".format({1: "Positive", 0: "Negative"}[doc["label"]])
+        return " {}".format({1: "positive", 0: "negative"}[doc["label"]])

    def construct_requests(self, doc, ctx):
-        ll_positive, _ = rf.loglikelihood(ctx, " Positive")
-        ll_negative, _ = rf.loglikelihood(ctx, " Negative")
+        ll_positive, _ = rf.loglikelihood(ctx, " positive")
+        ll_negative, _ = rf.loglikelihood(ctx, " negative")
        return ll_positive, ll_negative

    def process_results(self, doc, results):
@@ -129,7 +129,7 @@ class MNLI(HFTask):
    def doc_to_text(self, doc):
        return "{}\nQuestion: {} True, False or Neither?\nAnswer:".format(
            doc["premise"],
-            doc["hypothesis"] + ('' if doc["hypothesis"].endswith('.') else '.'),
+            doc["hypothesis"].strip() + ('' if doc["hypothesis"].strip().endswith('.') else '.'),
        )

    def doc_to_target(self, doc):
@@ -195,11 +195,11 @@ class QNLI(HFTask):
    def doc_to_target(self, doc):
        # True = entailment
        # False = not entailment
-        return " {}".format({0: "Yes", 1: "No"}[doc["label"]])
+        return " {}".format({0: "yes", 1: "no"}[doc["label"]])

    def construct_requests(self, doc, ctx):
-        ll_yes, _ = rf.loglikelihood(ctx, " Yes")
-        ll_no, _ = rf.loglikelihood(ctx, " No")
+        ll_yes, _ = rf.loglikelihood(ctx, " yes")
+        ll_no, _ = rf.loglikelihood(ctx, " no")
        return ll_yes, ll_no

    def process_results(self, doc, results):
@@ -347,8 +347,8 @@ class MRPC(HFTask):
        return " {}".format(yesno(doc["label"]))

    def construct_requests(self, doc, ctx):
-        ll_yes, _ = rf.loglikelihood(ctx, " Yes")
-        ll_no, _ = rf.loglikelihood(ctx, " No")
+        ll_yes, _ = rf.loglikelihood(ctx, " yes")
+        ll_no, _ = rf.loglikelihood(ctx, " no")
        return ll_yes, ll_no

    def process_results(self, doc, results):

--- a/lm_eval/tasks/superglue.py
+++ b/lm_eval/tasks/superglue.py
@@ -8,6 +8,7 @@ from . common import HFTask, yesno
 from lm_eval.base import rf, mean, acc_all, metric_max_over_ground_truths
 import sklearn
 import transformers.data.metrics.squad_metrics as squad_metrics
+from ..utils import general_detokenize


 class BoolQ(HFTask):
@@ -221,7 +222,7 @@ class MultiRC(HFTask):

    @staticmethod
    def format_answer(answer, label):
-        label_str = "Yes" if label else "No"
+        label_str = "yes" if label else "no"
        return f"{label_str}, {answer}"

    def construct_requests(self, doc, ctx):

--- a/lm_eval/utils.py
+++ b/lm_eval/utils.py
@@ -48,5 +48,5 @@ def general_detokenize(string):
    string = string.replace("( ", "(")
    string = string.replace("\" ", "\"")
    string = string.replace(" \"", "\"")
-    string = re.sub(r" (['.,])", r"\1")
+    string = re.sub(r" (['.,])", r"\1", string)
    return string
\ No newline at end of file