Commit 4e0410e9 authored by Sylvain Gugger

Fix in gather for SM distributed

parent 367c2ef5
@@ -162,8 +162,8 @@ def distributed_concat(tensor: Any, num_total_examples: Optional[int] = None) ->
         if isinstance(tensor, (tuple, list)):
             return type(tensor)(distributed_concat(t, num_total_examples) for t in tensor)
         output_tensors = [tensor.clone() for _ in range(dist.get_world_size())]
-        dist.all_gather(output_tensors, tensor)
         output_tensors = [t if len(t.shape) > 0 else t[None] for t in output_tensors]
+        dist.all_gather(output_tensors, tensor)
         concat = torch.cat(output_tensors, dim=0)
         # truncate the dummy elements added by SequentialDistributedSampler
......
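For context, here is a minimal, self-contained sketch (not part of the commit) of why the gathered tensors need at least one dimension: a scalar value such as a loss arrives as a 0-dim tensor, `torch.cat` refuses to concatenate 0-dim tensors, and the `t if len(t.shape) > 0 else t[None]` expression from the patch promotes each one to shape `(1,)`. The `promote_to_1d` helper name and the use of plain `torch` without any distributed backend are illustrative assumptions, not code from the repository.

```python
import torch


def promote_to_1d(tensors):
    # Illustrative helper (not from the commit): mirrors the patch's
    # `t if len(t.shape) > 0 else t[None]` to give 0-dim tensors a batch axis.
    return [t if len(t.shape) > 0 else t[None] for t in tensors]


# A scalar loss gathered from, say, two processes arrives as 0-dim tensors.
gathered = [torch.tensor(0.25), torch.tensor(0.31)]

# torch.cat cannot concatenate zero-dimensional tensors.
try:
    torch.cat(gathered, dim=0)
except RuntimeError as err:
    print(f"cat on 0-dim tensors fails: {err}")

# After promoting each tensor to shape (1,), concatenation works and yields
# a 1-D tensor holding one value per process.
concat = torch.cat(promote_to_1d(gathered), dim=0)
print(concat)  # tensor([0.2500, 0.3100])
```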