Implement gpt2 loglikelihood

8fffd927 · Leo Gao · 31696910 · 8fffd927
Commit 8fffd927 authored Sep 06, 2020 by Leo Gao
Hide whitespace changes
Inline Side-by-side

Showing with 9 additions and 1 deletion

gpt2.py gpt2.py +9 -1

No files found.
--- a/gpt2.py
+++ b/gpt2.py
 import transformers
 from base import LM
 import torch
+import torch.nn.functional as F
 class GPT2LM(LM):
@@ -16,4 +17,11 @@ class GPT2LM(LM):
        return self.tok.decode(res[0][len(context[0]):-1]).strip()
    def loglikelihood(self, context, continuation):
-        pass
+        """Score `continuation` under the model, conditioned on `context`.
+
+        `context + continuation` is encoded as one sequence and run through
+        `self.gpt2` once; the log-softmax of the logits is then read off at
+        the positions that predict each continuation token.
+
+        Args:
+            context: Conditioning text (str).
+            continuation: Text whose tokens are scored (str).
+
+        Returns:
+            Tensor of shape [1, n_continuation_tokens] holding the
+            log-probability assigned to each continuation token.
+
+        NOTE(review): `context` must encode to at least one token; with zero
+        context tokens the logits slice below is empty and no longer lines up
+        with the continuation tokens.
+        """
+        inp = torch.tensor([self.tok.encode(context + continuation)], dtype=torch.long)
+        # Only trailing whitespace is dropped before counting context tokens.
+        # Presumably the tokenizer folds a separating space into the token
+        # that follows it (TODO confirm), so a trailing space belongs to the
+        # continuation. Leading whitespace is still present in `inp`, so
+        # stripping it here would shift the boundary.
+        ctxlen = len(self.tok.encode(context.rstrip()))
+        cont_toks = inp[:, ctxlen:]  # [batch, seq]
+        # Scoring only: skip building the autograd graph.
+        with torch.no_grad():
+            # Logits at position i predict token i + 1, hence the one-step shift.
+            logprobs = F.log_softmax(self.gpt2(inp)[0], dim=-1)[:, ctxlen - 1:-1]  # [batch, seq, vocab]
+        return torch.gather(logprobs, 2, cont_toks.unsqueeze(-1)).squeeze(-1)