Commit d73be361 authored by zhuwenwen
Browse files

Merge branch 'v0.9.2-dev-bmm-2cd-0206-rebase-newest' into 'v0.9.2-dev'

去掉DTBmm的一个冗余条件

See merge request dcutoolkit/deeplearing/vllm!416
parents a1f5ce6e 8b6ef0da
...@@ -936,7 +936,6 @@ class MLACommonImpl(MLAAttentionImpl[M], Generic[M]): ...@@ -936,7 +936,6 @@ class MLACommonImpl(MLAAttentionImpl[M], Generic[M]):
def enable_fused_DTBmm(self): def enable_fused_DTBmm(self):
if envs.VLLM_USE_FUSED_DTBMM and \ if envs.VLLM_USE_FUSED_DTBMM and \
self.kv_cache_dtype == "fp8_e4m3" and \
torch.cuda.get_device_properties("cuda").gcnArchName.split(':')[0] == "gfx938": torch.cuda.get_device_properties("cuda").gcnArchName.split(':')[0] == "gfx938":
return True return True
else: else:
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment