Commit fd33fb97 authored by Benjamin Fattori, committed by lintangsutawika

comment on padding method for encoder

parent 26a9a445
@@ -186,11 +186,12 @@ class Seq2SeqHFLM(LM):
                 )
             )
+            # TODO: Right now, we pass a single EOT token to the encoder and the full context to the decoder
             rolling_token_windows = [(None,) + x for x in rolling_token_windows]
             pad_amnt = 0
             if self.world_size > 1:
-                # TODO: Comment on what we do here
+                # We pad out the external document-level iterator so the inner iterator doesn't hang
                 mytensor = torch.tensor(len(rolling_token_windows), device=self.device)
                 gathered = (
                     self.accelerator.gather(mytensor).cpu().detach().numpy().tolist()
...
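
The new comment describes a standard multi-process trick: every rank must enter the same number of collective calls, so ranks holding fewer documents pad their window lists up to the global maximum and discard the extra results afterwards. Below is a minimal sketch of that idea, assuming an Accelerate-style setup; the function name `pad_to_global_max` and the duplicate-first-entry padding scheme are illustrative, not taken verbatim from the commit.

```python
import torch
from accelerate import Accelerator


def pad_to_global_max(windows, accelerator: Accelerator, device):
    """Pad this rank's window list so all ranks iterate the same number of times."""
    # Gather the per-rank window counts so every rank learns the global maximum.
    mytensor = torch.tensor(len(windows), device=device)
    gathered = accelerator.gather(mytensor).cpu().detach().numpy().tolist()
    pad_amnt = max(gathered) - gathered[accelerator.process_index]
    # Duplicate the first window as filler (an assumption of this sketch); the
    # caller drops the last `pad_amnt` results after the loop. Without padding,
    # a rank that exhausts its windows early would skip the collective call
    # inside the inner loop and the other ranks would hang waiting for it.
    if pad_amnt > 0:
        windows = windows + pad_amnt * [windows[0]]
    return windows, pad_amnt
```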