Commit 006e8c6a authored by Atream
Browse files

remove causal mask

parent cdb6f896
@@ -649,9 +649,12 @@ class KDeepseekV2Model(BaseInjectedModule):
 if per_layer_prefill_flag:
     causal_mask = None
 else:
-    causal_mask = self._update_causal_mask(
-        attention_mask, inputs_embeds, cache_position, past_key_values, output_attentions
-    )
+    if os.name == 'nt':
+        causal_mask = self._update_causal_mask(
+            attention_mask, inputs_embeds, cache_position, past_key_values, output_attentions
+        )
+    else:
+        causal_mask = None
 # embed positions
 hidden_states = inputs_embeds
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment