Unverified commit eaeca3cd, authored by yyzxw and committed by GitHub
Browse files

[Bugfix] Parse SpeculativeConfig Error (#25142)


Signed-off-by: zxw <1020938856@qq.com>
Signed-off-by: Harry Mellor <19981378+hmellor@users.noreply.github.com>
Co-authored-by: Harry Mellor <19981378+hmellor@users.noreply.github.com>
parent 12c1287d
...@@ -1465,12 +1465,18 @@ class EngineArgs: ...@@ -1465,12 +1465,18 @@ class EngineArgs:
return False return False
# V1 supports N-gram, Medusa, and Eagle speculative decoding. # V1 supports N-gram, Medusa, and Eagle speculative decoding.
if (self.speculative_config is not None if self.speculative_config is not None:
and self.speculative_config.get("method") == "draft_model"): # speculative_config could still be a dict at this point
raise NotImplementedError( if isinstance(self.speculative_config, dict):
"Speculative decoding with draft model is not supported yet. " method = self.speculative_config.get("method", None)
"Please consider using other speculative decoding methods " else:
"such as ngram, medusa, eagle, or deepseek_mtp.") method = self.speculative_config.method
if method == "draft_model":
raise NotImplementedError(
"Draft model speculative decoding is not supported yet. "
"Please consider using other speculative decoding methods "
"such as ngram, medusa, eagle, or deepseek_mtp.")
V1_BACKENDS = [ V1_BACKENDS = [
"FLASH_ATTN_VLLM_V1", "FLASH_ATTN_VLLM_V1",
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment