removed truncation of source

a264f449 · jeffhsu3 · 18e08d29 · a264f449 · a264f449
Commit a264f449 authored Feb 10, 2021 by jeffhsu3
Show whitespace changes
Inline Side-by-side

Showing with 2 additions and 11 deletions

lm_eval/tasks/pubmedqa.py lm_eval/tasks/pubmedqa.py +0 -4

lm_eval/tasks/qa4mre.py lm_eval/tasks/qa4mre.py +2 -7

No files found.
--- a/lm_eval/tasks/pubmedqa.py
+++ b/lm_eval/tasks/pubmedqa.py
@@ -70,8 +70,4 @@ class Pubmed_QA(HFTask):
    def higher_is_better(self):
        return {
            "acc" : True
-<<<<<<< HEAD
        }
-=======
-        }
->>>>>>> 79878d135a19846868c182aa986b6ec740e7c884
--- a/lm_eval/tasks/qa4mre.py
+++ b/lm_eval/tasks/qa4mre.py
@@ -27,9 +27,6 @@ class QA4MRE(MultipleChoiceTask):
        }
        vpath = variable_year_path[year]
        url_path = f"{base_path}{vpath}QA4MRE-{year}-{lang}_GS.xml"
-        # Should all the years be concatenated together?
-        # Separate let's us compare with results from the competition
-        # Competition also separated out by topics
        if not os.path.exists("data/qa4mre"):
            os.mkdir("data/qa4mre")
        if not os.path.isfile(f"data/qa4mre/QA4MRE-{year}-{lang}"):
@@ -59,7 +56,7 @@ class QA4MRE(MultipleChoiceTask):
        out_doc = {
            "query" : question.find('q_str').text,
            "choices": choices, 
-            "gold" : int(question.find("./answer[@correct='Yes']").attrib["a_id"])-1,
+            "gold" : int(question.find("./answer[@correct='Yes']").attrib["a_id"]) - 1,
        }
        return out_doc
    
@@ -67,14 +64,12 @@ class QA4MRE(MultipleChoiceTask):
        tree = ET.parse(textfilename)
        root = tree.getroot()
        # TODO: context is much larger than the context sometimes
-        TRUNCATE = 4000
-        # Multiple questions per document
        for reading_test in root.iter('reading-test'):
            src = reading_test[0].text
            src = src.rstrip("\n\t\t\t").replace("\'", "'")
            for qid, question in enumerate(reading_test.iter('q')):
                out_doc = self._convert_standard(question)
-                out_doc['source'] = src[:TRUNCATE]
+                out_doc['source'] = src
                yield out_doc

    def fewshot_description(self):