Commit dc675592 authored by zhuwenwen
Browse files

off rotary_embedding_deepseek_fuse

parent f331f103
...@@ -958,7 +958,8 @@ class DeepseekScalingRotaryEmbedding(RotaryEmbedding): ...@@ -958,7 +958,8 @@ class DeepseekScalingRotaryEmbedding(RotaryEmbedding):
BLOCK_SIZE=BLOCK_SIZE, BLOCK_SIZE=BLOCK_SIZE,
num_warps=1) num_warps=1)
if envs.VLLM_USE_LIGHTOP: # if envs.VLLM_USE_LIGHTOP:
if False:
torch.ops.vllm.rotary_embedding_deepseek_fuse(positions, query, key, self.head_size, self.cos_sin_cache, self.is_neox_style) torch.ops.vllm.rotary_embedding_deepseek_fuse(positions, query, key, self.head_size, self.cos_sin_cache, self.is_neox_style)
else: else:
call(query) call(query)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment