# sleep mode support (enable_sleep_mode comes from vLLM's engine_args)
sleep_mode_level:int=1
# Whether to enable NATS for KV events (derived from kv_events_config in overwrite_args)
# Whether to enable NATS for KV events (derived from kv_events_config in overwrite_args)
use_kv_events:bool=False
use_kv_events:bool=False
...
@@ -301,13 +298,6 @@ def parse_args() -> Config:
...
@@ -301,13 +298,6 @@ def parse_args() -> Config:
default=False,
default=False,
help="Use vLLM's tokenizer for pre and post processing. This bypasses Dynamo's preprocessor and only v1/chat/completions will be available through the Dynamo frontend.",
help="Use vLLM's tokenizer for pre and post processing. This bypasses Dynamo's preprocessor and only v1/chat/completions will be available through the Dynamo frontend.",
Error:fmt.Sprintf("Image mismatch: checkpoint was from '%s' but placeholder uses '%s'. The placeholder must use the same base image. Use skip_image_validation=true to override.",checkpointMeta.Image,containerInfo.Image),