Commit bc5478a1 authored by Leo Gao
Browse files

Minor updates

parent c971fa82
@@ -18,7 +18,7 @@ class GPT2LM(LM):
         self.gpt2.eval()
         # pretrained tokenizer for neo is broken for now so just hardcoding this to gpt2
-        self.tokenizer = transformers.AutoTokenizer.from_pretrained('gpt2')
+        self.tokenizer = transformers.GPT2TokenizerFast.from_pretrained('gpt2')
         self.tokenizer.pad_token = "<|endoftext|>"
         self.max_length = self.gpt2.config.n_ctx
......
@@ -44,7 +44,7 @@ class GeneralHendrycksTest(MultipleChoiceTask):
         if not self.DATASET_PATH.exists():
             sh("""
                 mkdir -p data
-                wget https://people.eecs.berkeley.edu/~hendrycks/data.tar -P data/
+                wget -c https://people.eecs.berkeley.edu/~hendrycks/data.tar -P data/
                 tar -xf data/data.tar -C data/
                 rm data/data.tar
                 mv data/data data/hendrycksTest
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment