Commit 364e54d4 authored by Jonathan Tow
Browse files

Split `dev` and `val` sets and cleanup prompt spacing

parent b2bab740
...@@ -54,7 +54,7 @@ class GeneralHendrycksTest(MultipleChoiceTask): ...@@ -54,7 +54,7 @@ class GeneralHendrycksTest(MultipleChoiceTask):
return True return True
def has_validation_docs(self): def has_validation_docs(self):
return False return True
def has_test_docs(self): def has_test_docs(self):
return True return True
...@@ -69,9 +69,9 @@ class GeneralHendrycksTest(MultipleChoiceTask): ...@@ -69,9 +69,9 @@ class GeneralHendrycksTest(MultipleChoiceTask):
D. <choice4> D. <choice4>
Answer: Answer:
""" """
prompt = "Question: " + doc[0] prompt = "Question: " + doc[0] + "\n"
prompt += " ".join([f"\n{choices[j]}. {doc[j+1]}" for j in range(4)]) prompt += "".join([f"{choices[j]}. {doc[j+1]}\n" for j in range(4)])
prompt += "\nAnswer:" prompt += "Answer:"
return prompt return prompt
choices = ['A', 'B', 'C', 'D'] choices = ['A', 'B', 'C', 'D']
return { return {
...@@ -85,16 +85,12 @@ class GeneralHendrycksTest(MultipleChoiceTask): ...@@ -85,16 +85,12 @@ class GeneralHendrycksTest(MultipleChoiceTask):
return (self._convert_standard(doc) for doc in reader) return (self._convert_standard(doc) for doc in reader)
def training_docs(self): def training_docs(self):
# Use all files in the auxiliary_train, dev, val directories filename = self.DATASET_PATH / "dev" / f"{self.subject}_dev.csv"
# auxiliary_train includes some UnifiedQA MC tasks return self._load_docs(filename)
docs = []
for train_dir in ["auxiliary_train", "dev", "val"]:
for f in (self.DATASET_PATH / train_dir).iterdir():
docs.extend(self._load_docs(f))
return docs
def validation_docs(self): def validation_docs(self):
raise NotImplementedError filename = self.DATASET_PATH / "val" / f"{self.subject}_val.csv"
return self._load_docs(filename)
def test_docs(self): def test_docs(self):
filename = self.DATASET_PATH / "test" / f"{self.subject}_test.csv" filename = self.DATASET_PATH / "test" / f"{self.subject}_test.csv"
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment