Commit 4b26fd42 authored by zhuwenwen
Browse files

skip is_v32

parent 241ea5cd
......@@ -410,8 +410,8 @@ class DeepseekV32ForCausalLM(VerifyAndUpdateConfig):
hf_config = vllm_config.model_config.hf_config
# Mirror the check in vllm/model_executor/models/deepseek_v2.py
is_v32 = hasattr(hf_config, "index_topk")
assert is_v32
# is_v32 = hasattr(hf_config, "index_topk")
# assert is_v32
# For DeepSeekV3.2, we use a custom fp8 format as default (i.e.
# "auto")
......
......@@ -54,7 +54,8 @@ class DeepSeekMultiTokenPredictorLayer(nn.Module):
config.hidden_size,
bias=False)
self.is_v32 = hasattr(config, "index_topk")
# self.is_v32 = hasattr(config, "index_topk")
self.is_v32 = False
if self.is_v32:
topk_tokens = config.index_topk
topk_indices_buffer = torch.empty(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment