Unverified commit 5f671cb4, authored by Robert Shaw, committed by GitHub
Browse files

[V1] Improve Error Message for Unsupported Config (#12535)


Co-authored-by: Michael Goin <michael@neuralmagic.com>
parent bd02164c
...@@ -120,13 +120,18 @@ class CudaPlatformBase(Platform): ...@@ -120,13 +120,18 @@ class CudaPlatformBase(Platform):
if parallel_config.worker_cls == "auto": if parallel_config.worker_cls == "auto":
if scheduler_config.is_multi_step: if scheduler_config.is_multi_step:
if envs.VLLM_USE_V1: if envs.VLLM_USE_V1:
raise NotImplementedError raise NotImplementedError(
"Multi-step scheduling is not supported (and not "
"needed) on VLLM V1. Please launch without "
"--num-scheduler-steps.")
else: else:
parallel_config.worker_cls = \ parallel_config.worker_cls = \
"vllm.worker.multi_step_worker.MultiStepWorker" "vllm.worker.multi_step_worker.MultiStepWorker"
elif vllm_config.speculative_config: elif vllm_config.speculative_config:
if envs.VLLM_USE_V1: if envs.VLLM_USE_V1:
raise NotImplementedError raise NotImplementedError(
"Speculative decoding is not yet supported on VLLM V1."
)
else: else:
parallel_config.worker_cls = \ parallel_config.worker_cls = \
"vllm.spec_decode.spec_decode_worker.create_spec_worker" "vllm.spec_decode.spec_decode_worker.create_spec_worker"
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment