"git@developer.sourcefind.cn:dadigang/Ventoy.git" did not exist on "1065a41992ccb5e9e2e77c55a67609ba7d0c4d1a"
Commit 1c507995 authored by thomwolf
Browse files

simpler distilbert mask - fix tf tests

parent 58b302ca
......@@ -159,8 +159,6 @@ class MultiHeadSelfAttention(nn.Module):
dim_per_head = self.dim // self.n_heads
assert 2 <= mask.dim() <= 3
causal = (mask.dim() == 3)
mask_reshp = (bs, 1, 1, k_length)
def shape(x):
......
......@@ -226,9 +226,6 @@ class TFMultiHeadSelfAttention(tf.keras.layers.Layer):
dim_per_head = self.dim // self.n_heads
mask_shape = shape_list(mask)
assert 2 <= len(mask_shape) <= 3
causal = (len(mask_shape) == 3)
mask_reshape = [bs, 1, 1, k_length]
def shape(x):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment