Commit 23b7138a authored by thomwolf's avatar thomwolf
Browse files

fix #1378 and #1453

parent d688af19
...@@ -226,8 +226,9 @@ class TFMultiHeadSelfAttention(tf.keras.layers.Layer): ...@@ -226,8 +226,9 @@ class TFMultiHeadSelfAttention(tf.keras.layers.Layer):
dim_per_head = self.dim // self.n_heads dim_per_head = self.dim // self.n_heads
assert 2 <= len(tf.shape(mask)) <= 3 mask_shape = shape_list(mask)
causal = (len(tf.shape(mask)) == 3) assert 2 <= len(mask_shape) <= 3
causal = (mask_shape) == 3)
mask_reshape = [bs, 1, 1, k_length] mask_reshape = [bs, 1, 1, k_length]
def shape(x): def shape(x):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment