Unverified commit 19b7acdd, authored by Alessandro Suglia and committed by GitHub
Browse files

Cloned tensors after indexing in _compute_attn_output_with_global_indices (#13613)


Co-authored-by: Alessandro Suglia <asuglia@fb.com>
parent ce32c69c
......@@ -586,7 +586,7 @@ class LEDEncoderSelfAttention(nn.Module):
# attn = torch.einsum('blhs,bshd->blhd', (selected_attn_probs, selected_v))
# compute attn output only global
attn_output_only_global = torch.matmul(
- attn_probs_only_global.transpose(1, 2), value_vectors_only_global.transpose(1, 2)
+ attn_probs_only_global.transpose(1, 2).clone(), value_vectors_only_global.transpose(1, 2).clone()
).transpose(1, 2)
# reshape attn probs
......
......@@ -976,7 +976,7 @@ class LongformerSelfAttention(nn.Module):
# attn = torch.einsum('blhs,bshd->blhd', (selected_attn_probs, selected_v))
# compute attn output only global
attn_output_only_global = torch.matmul(
- attn_probs_only_global.transpose(1, 2), value_vectors_only_global.transpose(1, 2)
+ attn_probs_only_global.transpose(1, 2).clone(), value_vectors_only_global.transpose(1, 2).clone()
).transpose(1, 2)
# reshape attn probs
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment