Commit 9aabf7e7 authored by laibao
Browse files

feat(deepseek-mla): 精简 fused RMS-RoPE concat 可用性判断

parent cae53e46
...@@ -2216,17 +2216,8 @@ class MLACommonImpl(MLACommonBaseImpl[M], Generic[M]): ...@@ -2216,17 +2216,8 @@ class MLACommonImpl(MLACommonBaseImpl[M], Generic[M]):
if kv_cache_dtype_str not in ("fp16", "bf16"): if kv_cache_dtype_str not in ("fp16", "bf16"):
use_fused_rms_rope_concat = False use_fused_rms_rope_concat = False
fused_inputs_provided = (
q_ori is not None
or key_normed is not None
or positions is not None
or weight is not None
or cos_sin_cache is not None
or epsilon is not None
)
if ( if (
envs.VLLM_USE_LIGHTOP_RMS_ROPE_CONCAT envs.VLLM_USE_LIGHTOP_RMS_ROPE_CONCAT
and fused_inputs_provided
and not use_fused_rms_rope_concat and not use_fused_rms_rope_concat
): ):
raise RuntimeError( raise RuntimeError(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment