Commit 364e54d4 authored by Jonathan Tow's avatar Jonathan Tow
Browse files

Split `dev` and `val` sets and cleanup prompt spacing

parent b2bab740
......@@ -54,7 +54,7 @@ class GeneralHendrycksTest(MultipleChoiceTask):
return True
def has_validation_docs(self):
return False
return True
def has_test_docs(self):
return True
......@@ -69,9 +69,9 @@ class GeneralHendrycksTest(MultipleChoiceTask):
D. <choice4>
Answer:
"""
prompt = "Question: " + doc[0]
prompt += " ".join([f"\n{choices[j]}. {doc[j+1]}" for j in range(4)])
prompt += "\nAnswer:"
prompt = "Question: " + doc[0] + "\n"
prompt += "".join([f"{choices[j]}. {doc[j+1]}\n" for j in range(4)])
prompt += "Answer:"
return prompt
choices = ['A', 'B', 'C', 'D']
return {
......@@ -85,16 +85,12 @@ class GeneralHendrycksTest(MultipleChoiceTask):
return (self._convert_standard(doc) for doc in reader)
def training_docs(self):
# Use all files in the auxiliary_train, dev, val directories
# auxiliary_train includes some UnifiedQA MC tasks
docs = []
for train_dir in ["auxiliary_train", "dev", "val"]:
for f in (self.DATASET_PATH / train_dir).iterdir():
docs.extend(self._load_docs(f))
return docs
filename = self.DATASET_PATH / "dev" / f"{self.subject}_dev.csv"
return self._load_docs(filename)
def validation_docs(self):
raise NotImplementedError
filename = self.DATASET_PATH / "val" / f"{self.subject}_val.csv"
return self._load_docs(filename)
def test_docs(self):
filename = self.DATASET_PATH / "test" / f"{self.subject}_test.csv"
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment