@@ -63,16 +63,6 @@ class DynamoVllmArgGroup(ArgGroup):
...
@@ -63,16 +63,6 @@ class DynamoVllmArgGroup(ArgGroup):
help="Use vLLM's tokenizer for pre and post processing. This bypasses Dynamo's preprocessor and only v1/chat/completions will be available through the Dynamo frontend.",
help="Use vLLM's tokenizer for pre and post processing. This bypasses Dynamo's preprocessor and only v1/chat/completions will be available through the Dynamo frontend.",
)
)
# Register the integer-valued --sleep-mode-level option on argument group `g`.
# Accepted values are limited to 1, 2 or 3; the default is 1.
# NOTE(review): presumably DYN_VLLM_SLEEP_MODE_LEVEL acts as the environment
# fallback when the flag is not passed — confirm against add_argument().
add_argument(
g,
flag_name="--sleep-mode-level",
env_var="DYN_VLLM_SLEEP_MODE_LEVEL",
arg_type=int,
choices=[1, 2, 3],
default=1,
help="Sleep mode level (1=offload to CPU, 2=discard weights, 3=discard all).",
)
# Multimodal
# Multimodal
add_negatable_bool_argument(
add_negatable_bool_argument(
g,
g,
...
@@ -178,7 +168,6 @@ class DynamoVllmConfig(ConfigBase):
...
@@ -178,7 +168,6 @@ class DynamoVllmConfig(ConfigBase):
The snapshot-agent no longer reads `basePath` from its ConfigMap, but the operator still uses its configured PVC base path when it annotates checkpoint and restore pods. That path must match `storage.pvc.basePath` here so the mounted checkpoint location is valid inside the agent pod.
Cross-node restore requires a shared `ReadWriteMany` storage class. The chart defaults to `storage.pvc.accessMode=ReadWriteMany`.
Cross-node restore requires a shared `ReadWriteMany` storage class. The chart defaults to `storage.pvc.accessMode=ReadWriteMany`.
For better restore times, use a fast `ReadWriteMany` StorageClass for the checkpoint PVC.
For better restore times, use a fast `ReadWriteMany` StorageClass for the checkpoint PVC.
// +kubebuilder:validation:XValidation:rule="!(self.disabled && has(self.size))",message="sharedMemory.size must not be set when sharedMemory.disabled is true"
typeSharedMemorySpecstruct{
typeSharedMemorySpecstruct{
Disabledbool`json:"disabled,omitempty"`
Disabledbool`json:"disabled,omitempty"`
Sizeresource.Quantity`json:"size,omitempty"`
Sizeresource.Quantity`json:"size,omitempty"`
...
@@ -192,8 +193,8 @@ type ServiceCheckpointConfig struct {
...
@@ -192,8 +193,8 @@ type ServiceCheckpointConfig struct {
// +kubebuilder:default=Auto
// +kubebuilder:default=Auto
ModeCheckpointMode`json:"mode,omitempty"`
ModeCheckpointMode`json:"mode,omitempty"`
// CheckpointRef references an existing Checkpoint CR to use
// CheckpointRef references an existing DynamoCheckpoint CR by metadata.name.
// If specified, Identity is ignored and this checkpoint is used directly
// If specified, this service's Identity is ignored and the referenced checkpoint is used directly.