feat: Add v1beta1 DGDR API with conversion framework (#6352)

Signed-off-by: Jont828 <jt572@cornell.edu> Signed-off-by: Hongkuan Zhou <hongkuanz@nvidia.com> Signed-off-by: Hannah Zhang <hannahz@nvidia.com> Co-authored-by: Jont828 <jt572@cornell.edu>

feat: Add v1beta1 DGDR API with conversion framework (#6352)
Signed-off-by: Jont828 <jt572@cornell.edu> Signed-off-by: Hongkuan Zhou <hongkuanz@nvidia.com> Signed-off-by: Hannah Zhang <hannahz@nvidia.com> Co-authored-by: Jont828 <jt572@cornell.edu>
ebc61637 · hhzhang16 · GitHub · 7bbacce1 · ebc61637 · ebc61637
Unverified Commit ebc61637 authored Feb 19, 2026 by hhzhang16 Committed by GitHub Feb 19, 2026
20 changed files
--- a/.github/workflows/pr.yaml
+++ b/.github/workflows/pr.yaml
@@ -117,6 +117,16 @@ jobs:
        uses: actions/setup-go@44694675825211faa026b3c33043df3e48a5fa00 # v6.0.0
        with:
          go-version: '1.25'
+      # Python toolchain for the operator's Pydantic codegen (the Makefile's
+      # `generate` target depends on `generate-pydantic`).
+      - name: Set up Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: "3.11"
+      # pydantic is constrained to 2.x; black is pinned to an exact version.
+      # NOTE(review): black is presumably used to format the generated module so
+      # output is reproducible — confirm against generate_pydantic_from_go.py.
+      - name: Install Python dependencies for operator codegen
+        shell: bash
+        working-directory: ./deploy/operator
+        run: |
+          python -m pip install --upgrade pip
+          python -m pip install "pydantic>=2,<3" "black==23.1.0"
      - name: Check for uncommitted changes
        shell: bash
        working-directory: ./deploy/operator

--- a/components/src/dynamo/profiler/utils/dgdr_v1beta1_types.py
+++ b/components/src/dynamo/profiler/utils/dgdr_v1beta1_types.py
+# SPDX-FileCopyrightText: Copyright (c) 2024-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""
+Auto-generated Pydantic models from v1beta1 DGDR Go types.
+
+Generated by: deploy/operator/api/scripts/generate_pydantic_from_go.py
+Source: deploy/operator/api/v1beta1/dynamographdeploymentrequest_types.go
+
+DO NOT EDIT MANUALLY - regenerate using the script.
+"""
+
+from enum import Enum
+from typing import Any, Dict, List, Optional
+
+from pydantic import BaseModel, Field, model_validator
+
+
+class DGDRPhase(str, Enum):
+    """High-level lifecycle phase of a deployment request (``status.phase``)."""
+
+    Pending = "Pending"
+    Profiling = "Profiling"
+    Ready = "Ready"
+    Deploying = "Deploying"
+    Deployed = "Deployed"
+    Failed = "Failed"
+
+
+class ProfilingPhase(str, Enum):
+    """Sub-phase of the profiling pipeline (``status.profilingPhase``)."""
+
+    Initializing = "Initializing"
+    SweepingPrefill = "SweepingPrefill"
+    SweepingDecode = "SweepingDecode"
+    SelectingConfig = "SelectingConfig"
+    BuildingCurves = "BuildingCurves"
+    GeneratingDGD = "GeneratingDGD"
+    Done = "Done"
+
+
+class OptimizationType(str, Enum):
+    """Profiling optimization objective, used by ``SLASpec.optimizationType``."""
+
+    Latency = "latency"
+    Throughput = "throughput"
+
+
+class SearchStrategy(str, Enum):
+    """Profiling search depth.
+
+    ``rapid`` performs a fast sweep; ``thorough`` explores more configurations.
+    """
+
+    Rapid = "rapid"
+    Thorough = "thorough"
+
+
+class BackendType(str, Enum):
+    """Inference backend used for profiling and deployment."""
+
+    Auto = "auto"
+    Sglang = "sglang"
+    Trtllm = "trtllm"
+    Vllm = "vllm"
+
+
+class PlannerPreDeploymentSweepMode(str, Enum):
+    """Pre-deployment sweeping mode for planner in-depth profiling.
+
+    Used by ``PlannerSpec.plannerPreDeploymentSweeping``.
+    """
+
+    # Trailing underscore because ``None`` is a reserved word in Python; the
+    # serialized value is still "none".
+    None_ = "none"
+    Rapid = "rapid"
+    Thorough = "thorough"
+
+
+class WorkloadSpec(BaseModel):
+    """WorkloadSpec defines the workload characteristics for SLA-based profiling.
+
+    ``isl`` and ``osl`` default to 4000 and 1000 tokens; ``concurrency`` and
+    ``requestRate`` default to ``None``. The "required when the planner is
+    disabled" rule mentioned in the field descriptions is not enforced by this
+    model (it defines no validator).
+    """
+
+    isl: Optional[int] = Field(
+        default=4000, description="ISL is the Input Sequence Length (number of tokens)."
+    )
+    osl: Optional[int] = Field(
+        default=1000,
+        description="OSL is the Output Sequence Length (number of tokens).",
+    )
+    concurrency: Optional[float] = Field(
+        default=None,
+        description="Concurrency is the target concurrency level. Required (or RequestRate) when the planner is disabled.",
+    )
+    requestRate: Optional[float] = Field(
+        default=None,
+        description="RequestRate is the target request rate (req/s). Required (or Concurrency) when the planner is disabled.",
+    )
+
+
+class SLASpec(BaseModel):
+    """Service-level agreement targets.
+
+    Provide exactly one of:
+
+    - ``ttft`` + ``itl``: explicit latency targets (default: 2000 ms / 30 ms)
+    - ``e2eLatency``: end-to-end latency target
+    - ``optimizationType``: high-level objective without explicit numeric targets"""
+
+    optimizationType: Optional[OptimizationType] = Field(
+        default=None,
+        description="OptimizationType controls the profiling optimization strategy. Use when explicit SLA targets (ttft+itl or e2eLatency) are not known.",
+    )
+    ttft: Optional[float] = Field(
+        default=2000,
+        description="TTFT is the Time To First Token target in milliseconds.",
+    )
+    itl: Optional[float] = Field(
+        default=30, description="ITL is the Inter-Token Latency target in milliseconds."
+    )
+    e2eLatency: Optional[float] = Field(
+        default=None,
+        description="E2ELatency is the target end-to-end request latency in milliseconds. Alternative to specifying TTFT + ITL.",
+    )
+
+    @model_validator(mode="after")
+    def _validate_sla_options(self) -> "SLASpec":
+        """Ensure at most one SLA mode is active."""
+        has_ttft_itl = self.ttft is not None and self.itl is not None
+        has_e2e = self.e2eLatency is not None
+        has_opt = self.optimizationType is not None
+        options_count = sum([has_ttft_itl, has_e2e, has_opt])
+        if options_count > 1:
+            raise ValueError(
+                "SLA must specify exactly one of: (ttft and itl), e2eLatency, "
+                "or optimizationType — not multiple."
+            )
+        if (self.ttft is not None) != (self.itl is not None):
+            raise ValueError("ttft and itl must both be provided together.")
+        return self
+
+
+class ModelCacheSpec(BaseModel):
+    """ModelCacheSpec references a PVC containing pre-downloaded model weights.
+
+    ``pvcName`` and ``pvcModelPath`` default to ``None``; ``pvcMountPath`` is a
+    non-optional ``str`` that defaults to ``/opt/model-cache``.
+    """
+
+    pvcName: Optional[str] = Field(
+        default=None,
+        description="PVCName is the name of the PersistentVolumeClaim containing model weights. The PVC must exist in the same namespace as the DGDR.",
+    )
+    pvcModelPath: Optional[str] = Field(
+        default=None,
+        description='PVCModelPath is the path to the model checkpoint directory within the PVC (e.g. "deepseek-r1" or "models/Llama-3.1-405B-FP8").',
+    )
+    pvcMountPath: str = Field(
+        default="/opt/model-cache",
+        description="PVCMountPath is the mount path for the PVC inside the container.",
+    )
+
+
+class OverridesSpec(BaseModel):
+    """OverridesSpec allows customizing the profiling job and the generated DynamoGraphDeployment.
+
+    Both fields are free-form ``Dict[str, Any]`` payloads defaulting to
+    ``None``; this model does not validate their contents.
+    """
+
+    profilingJob: Optional[Dict[str, Any]] = Field(
+        default=None,
+        description="ProfilingJob allows overriding the profiling Job specification. Fields set here are merged into the controller-generated Job spec.",
+    )
+    dgd: Optional[Dict[str, Any]] = Field(
+        default=None,
+        description="DGD allows providing a full or partial nvidia.com/v1alpha1 DynamoGraphDeployment to use as the base for the generated deployment. Fields from profiling results are merged on top. Use this to override backend worker images.  The field is stored as a raw embedded resource rather than a typed *v1alpha1.DynamoGraphDeployment to avoid a circular import: v1alpha1 already imports v1beta1 as the conversion hub and Go does not allow import cycles.  The EmbeddedResource marker tells the API server to validate that the value is a well-formed Kubernetes object (has apiVersion/kind), but does not enforce that it is specifically a DynamoGraphDeployment. Full type validation (correct apiVersion, kind, and field schema) is performed by the controller during reconciliation. TODO(future MR): add webhook admission validation for the DGD field type.",
+    )
+
+
+class PlannerSpec(BaseModel):
+    """PlannerSpec configures the SLA planner for autoscaling in the generated DGD.
+
+    Every field is optional and defaults to ``None`` (unset), including
+    ``enabled``, which is therefore tri-state rather than a plain boolean.
+    """
+
+    enabled: Optional[bool] = Field(
+        default=None, description="Enabled indicates whether the planner is enabled."
+    )
+    plannerPreDeploymentSweeping: Optional[PlannerPreDeploymentSweepMode] = Field(
+        default=None,
+        description='PlannerPreDeploymentSweeping controls pre-deployment sweeping mode for planner in-depth profiling. "none" means no pre-deployment sweep (only load-based scaling). "rapid" uses AI Configurator to simulate engine performance. "thorough" uses real GPUs to measure engine performance (takes several hours).',
+    )
+    plannerArgsList: Optional[List[str]] = Field(
+        default=None,
+        description="PlannerArgsList is a list of additional planner arguments.",
+    )
+
+
+class MockerSpec(BaseModel):
+    """MockerSpec configures the simulated (mocker) backend.
+
+    ``enabled`` defaults to ``None`` (unset) rather than ``False``.
+    """
+
+    enabled: Optional[bool] = Field(
+        default=None,
+        description="Enabled indicates whether to deploy mocker workers instead of real inference workers. Useful for large-scale testing without GPUs.",
+    )
+
+
+class KVRouterSpec(BaseModel):
+    """KVRouterSpec configures KV-cache-aware routing.
+
+    ``enabled`` defaults to ``None`` (unset) rather than ``False``.
+
+    NOTE(review): no model visible in this module has a field of this type
+    (``FeaturesSpec`` only exposes ``planner`` and ``mocker``) — confirm against
+    the Go types whether a ``kvRouter`` field is expected.
+    """
+
+    enabled: Optional[bool] = Field(
+        default=None,
+        description="Enabled indicates whether to enable KV-cache-aware routing in the generated DGD. KV routing optimizes request scheduling based on KV cache locality.",
+    )
+
+
+class FeaturesSpec(BaseModel):
+    """FeaturesSpec controls optional Dynamo platform features in the generated deployment.
+
+    Exposes the ``planner`` and ``mocker`` sub-specs; both default to ``None``.
+    """
+
+    planner: Optional[PlannerSpec] = Field(
+        default=None,
+        description="Planner configures the SLA planner for autoscaling in the generated DGD.",
+    )
+    mocker: Optional[MockerSpec] = Field(
+        default=None,
+        description="Mocker configures the simulated (mocker) backend for testing without GPUs.",
+    )
+
+
+class HardwareSpec(BaseModel):
+    """HardwareSpec describes the hardware resources available for profiling and deployment.
+
+    These fields are typically auto-filled by the operator from cluster
+    discovery. Every field is optional and defaults to ``None``; ``vramMb`` is
+    typed as ``float`` while the GPU counts are ``int``.
+    """
+
+    gpuSku: Optional[str] = Field(
+        default=None,
+        description='GPUSKU is the GPU SKU identifier (e.g., "H100_SXM", "A100_80GB").',
+    )
+    vramMb: Optional[float] = Field(
+        default=None, description="VRAMMB is the VRAM per GPU in MiB."
+    )
+    totalGpus: Optional[int] = Field(
+        default=None,
+        description="TotalGPUs is the total number of GPUs available in the cluster.",
+    )
+    numGpusPerNode: Optional[int] = Field(
+        default=None, description="NumGPUsPerNode is the number of GPUs per node."
+    )
+
+
+class DynamoGraphDeploymentRequestSpec(BaseModel):
+    """DynamoGraphDeploymentRequestSpec defines the desired state of a DynamoGraphDeploymentRequest. Only the Model field is required; all other fields are optional and have sensible defaults."""
+
+    model: str = Field(
+        description='Model specifies the model to deploy (e.g., "Qwen/Qwen3-0.6B", "meta-llama/Llama-3-70b"). Can be a HuggingFace ID or a private model name.'
+    )
+    backend: BackendType = Field(
+        default="auto",
+        description="Backend specifies the inference backend to use for profiling and deployment.",
+    )
+    image: Optional[str] = Field(
+        default=None,
+        description='Image is the container image reference for the profiling job (frontend image). Example: "nvcr.io/nvidia/dynamo-runtime:latest" TODO: In a future MR, the operator will derive the backend inference image from the backend type automatically; backend images can be overridden via overrides.dgd.',
+    )
+    modelCache: Optional[ModelCacheSpec] = Field(
+        default=None,
+        description="ModelCache provides optional PVC configuration for pre-downloaded model weights. When provided, weights are loaded from the PVC instead of downloading from HuggingFace.",
+    )
+    hardware: Optional[HardwareSpec] = Field(
+        default=None,
+        description="Hardware describes the hardware resources available for profiling and deployment. Typically auto-filled by the operator from cluster discovery.",
+    )
+    workload: Optional[WorkloadSpec] = Field(
+        default=None,
+        description="Workload defines the expected workload characteristics for SLA-based profiling.",
+    )
+    sla: Optional[SLASpec] = Field(
+        default=None,
+        description="SLA defines service-level agreement targets that drive profiling optimization.",
+    )
+    overrides: Optional[OverridesSpec] = Field(
+        default=None,
+        description="Overrides allows customizing the profiling job and the generated DynamoGraphDeployment.",
+    )
+    features: Optional[FeaturesSpec] = Field(
+        default=None,
+        description="Features controls optional Dynamo platform features in the generated deployment.",
+    )
+    searchStrategy: SearchStrategy = Field(
+        default="rapid",
+        description='SearchStrategy controls the profiling search depth. "rapid" performs a fast sweep; "thorough" explores more configurations.',
+    )
+    autoApply: bool = Field(
+        default=True,
+        description="AutoApply indicates whether to automatically create a DynamoGraphDeployment after profiling completes. If false, the generated spec is stored in status for manual review and application.",
+    )
+
+
+class ParetoConfig(BaseModel):
+    """ParetoConfig represents a single Pareto-optimal deployment configuration discovered during profiling.
+
+    ``config`` is required (no default) and is an untyped ``Dict[str, Any]``.
+    """
+
+    config: Dict[str, Any] = Field(
+        description="Config is the full deployment configuration for this Pareto point."
+    )
+
+
+class ProfilingResultsStatus(BaseModel):
+    """ProfilingResultsStatus contains the output of the profiling process.
+
+    Both fields default to ``None``. ``selectedConfig`` is a raw dict, not a
+    ``ParetoConfig`` instance.
+    """
+
+    pareto: Optional[List[ParetoConfig]] = Field(
+        default=None,
+        description="Pareto is the list of Pareto-optimal deployment configurations discovered during profiling. Each entry represents a different cost/performance trade-off.",
+    )
+    selectedConfig: Optional[Dict[str, Any]] = Field(
+        default=None,
+        description="SelectedConfig is the recommended configuration chosen by the profiler based on the SLA targets. This is the configuration used for deployment when autoApply is true.",
+    )
+
+
+class DeploymentInfoStatus(BaseModel):
+    """DeploymentInfoStatus tracks the state of the deployed DynamoGraphDeployment.
+
+    Both replica counts are optional and default to ``None``.
+    """
+
+    replicas: Optional[int] = Field(
+        default=None, description="Replicas is the desired number of replicas."
+    )
+    availableReplicas: Optional[int] = Field(
+        default=None,
+        description="AvailableReplicas is the number of replicas that are available and ready.",
+    )
+
+
+class DynamoGraphDeploymentRequestStatus(BaseModel):
+    """DynamoGraphDeploymentRequestStatus represents the observed state of a DynamoGraphDeploymentRequest.
+
+    Every field is optional and defaults to ``None``, so an empty status
+    validates.
+    """
+
+    phase: Optional[DGDRPhase] = Field(
+        default=None,
+        description="Phase is the high-level lifecycle phase of the deployment request.",
+    )
+    profilingPhase: Optional[ProfilingPhase] = Field(
+        default=None,
+        description='ProfilingPhase indicates the current sub-phase of the profiling pipeline. Only meaningful when Phase is "Profiling". Cleared when profiling completes or fails.',
+    )
+    dgdName: Optional[str] = Field(
+        default=None,
+        description="DGDName is the name of the generated or created DynamoGraphDeployment.",
+    )
+    profilingJobName: Optional[str] = Field(
+        default=None,
+        description="ProfilingJobName is the name of the Kubernetes Job running the profiler.",
+    )
+    profilingResults: Optional[ProfilingResultsStatus] = Field(
+        default=None,
+        description="ProfilingResults contains the output of the profiling process including Pareto-optimal configurations and the selected deployment configuration.",
+    )
+    deploymentInfo: Optional[DeploymentInfoStatus] = Field(
+        default=None,
+        description="DeploymentInfo tracks the state of the deployed DynamoGraphDeployment. Populated when a DGD has been created (either via autoApply or manually).",
+    )
+    observedGeneration: Optional[int] = Field(
+        default=None,
+        description="ObservedGeneration is the most recent generation observed by the controller.",
+    )
+
+
+class DynamoGraphDeploymentRequest(BaseModel):
+    """DynamoGraphDeploymentRequest is the Schema for the dynamographdeploymentrequests API.
+
+    It provides a simplified, SLA-driven interface for deploying inference
+    models on Dynamo. Users specify a model and optional performance targets;
+    the controller handles profiling, configuration selection, and deployment.
+
+    Only ``spec`` and ``status`` are modelled here (both default to ``None``);
+    this class declares no ``apiVersion``, ``kind`` or ``metadata`` fields.
+    """
+
+    spec: Optional[DynamoGraphDeploymentRequestSpec] = Field(
+        default=None,
+        description="Spec defines the desired state for this deployment request.",
+    )
+    status: Optional[DynamoGraphDeploymentRequestStatus] = Field(
+        default=None,
+        description="Status reflects the current observed state of this deployment request.",
+    )
--- a/deploy/helm/charts/crds/templates/nvidia.com_dynamographdeploymentrequests.yaml
+++ b/deploy/helm/charts/crds/templates/nvidia.com_dynamographdeploymentrequests.yaml
--- a/deploy/helm/charts/platform/components/operator/templates/webhook-ca-inject-job.yaml
+++ b/deploy/helm/charts/platform/components/operator/templates/webhook-ca-inject-job.yaml
@@ -106,6 +106,10 @@ rules:
  resourceNames: ["{{ include "dynamo-operator.fullname" . }}-mutating"]
  {{- end }}
  verbs: ["get", "patch"]
+# Lets the CA-inject job read and patch the DGDR CRD (and only that CRD) so it
+# can set spec.conversion with the webhook service and CA bundle.
+- apiGroups: ["apiextensions.k8s.io"]
+  resources: ["customresourcedefinitions"]
+  resourceNames: ["dynamographdeploymentrequests.nvidia.com"]
+  verbs: ["get", "patch"]
 ---
 apiVersion: rbac.authorization.k8s.io/v1
 kind: ClusterRoleBinding
@@ -253,6 +257,29 @@ spec:
              }
            ]"

+          echo "📝 Patching DGDR CRD spec.conversion..."
+          # Set the full conversion block (strategy + service + caBundle) in one merge patch.
+          # This is idempotent: safe to run on install and upgrade.
+          kubectl patch crd dynamographdeploymentrequests.nvidia.com \
+            --type merge --patch "{
+              \"spec\": {
+                \"conversion\": {
+                  \"strategy\": \"Webhook\",
+                  \"webhook\": {
+                    \"clientConfig\": {
+                      \"service\": {
+                        \"name\": \"{{ include "dynamo-operator.fullname" . }}-webhook-service\",
+                        \"namespace\": \"{{ .Release.Namespace }}\",
+                        \"path\": \"/convert\"
+                      },
+                      \"caBundle\": \"${CA_BUNDLE}\"
+                    },
+                    \"conversionReviewVersions\": [\"v1\"]
+                  }
+                }
+              }
+            }"
+
          echo "✅ CA bundle injected successfully!"
          echo "🎉 Webhook configuration complete!"
        securityContext:

--- a/deploy/helm/charts/platform/components/operator/templates/webhook-crd-conversion-certmanager.yaml
+++ b/deploy/helm/charts/platform/components/operator/templates/webhook-crd-conversion-certmanager.yaml
+# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+{{- if and .Values.webhook.enabled .Values.webhook.certManager.enabled }}
+---
+# ServiceAccount for the CRD conversion patch job
+apiVersion: v1
+kind: ServiceAccount
+metadata:
+  name: {{ include "dynamo-operator.fullname" . }}-crd-conversion-patch
+  namespace: {{ .Release.Namespace }}
+  labels:
+    app.kubernetes.io/component: webhook
+    app.kubernetes.io/created-by: dynamo-operator
+    app.kubernetes.io/part-of: dynamo-operator
+  {{- include "dynamo-operator.labels" . | nindent 4 }}
+  annotations:
+    "helm.sh/hook": post-install,post-upgrade
+    "helm.sh/hook-weight": "1"
+    "helm.sh/hook-delete-policy": before-hook-creation
+---
+# ClusterRole to patch the DGDR CRD
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRole
+metadata:
+  name: {{ include "dynamo-operator.fullname" . }}-crd-conversion-patch
+  labels:
+    app.kubernetes.io/component: webhook
+    app.kubernetes.io/created-by: dynamo-operator
+    app.kubernetes.io/part-of: dynamo-operator
+  {{- include "dynamo-operator.labels" . | nindent 4 }}
+  annotations:
+    "helm.sh/hook": post-install,post-upgrade
+    "helm.sh/hook-weight": "1"
+    "helm.sh/hook-delete-policy": before-hook-creation
+rules:
+- apiGroups: ["apiextensions.k8s.io"]
+  resources: ["customresourcedefinitions"]
+  resourceNames: ["dynamographdeploymentrequests.nvidia.com"]
+  verbs: ["get", "patch"]
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: {{ include "dynamo-operator.fullname" . }}-crd-conversion-patch
+  labels:
+    app.kubernetes.io/component: webhook
+    app.kubernetes.io/created-by: dynamo-operator
+    app.kubernetes.io/part-of: dynamo-operator
+  {{- include "dynamo-operator.labels" . | nindent 4 }}
+  annotations:
+    "helm.sh/hook": post-install,post-upgrade
+    "helm.sh/hook-weight": "1"
+    "helm.sh/hook-delete-policy": before-hook-creation
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: {{ include "dynamo-operator.fullname" . }}-crd-conversion-patch
+subjects:
+- kind: ServiceAccount
+  name: {{ include "dynamo-operator.fullname" . }}-crd-conversion-patch
+  namespace: {{ .Release.Namespace }}
+---
+# Job to patch the DGDR CRD with spec.conversion and cert-manager CA injection annotation.
+# The cert-manager ca-injector then watches the CRD annotation and keeps the caBundle
+# in spec.conversion.webhook.clientConfig.caBundle up to date automatically.
+apiVersion: batch/v1
+kind: Job
+metadata:
+  name: {{ include "dynamo-operator.fullname" . }}-crd-conversion-patch-{{ .Release.Revision }}
+  namespace: {{ .Release.Namespace }}
+  labels:
+    app.kubernetes.io/component: webhook
+    app.kubernetes.io/created-by: dynamo-operator
+    app.kubernetes.io/part-of: dynamo-operator
+  {{- include "dynamo-operator.labels" . | nindent 4 }}
+  annotations:
+    "helm.sh/hook": post-install,post-upgrade
+    "helm.sh/hook-weight": "2"
+    "helm.sh/hook-delete-policy": before-hook-creation
+spec:
+  backoffLimit: 5
+  template:
+    metadata:
+      name: {{ include "dynamo-operator.fullname" . }}-crd-conversion-patch
+      labels:
+        app.kubernetes.io/component: webhook
+        app.kubernetes.io/created-by: dynamo-operator
+        app.kubernetes.io/part-of: dynamo-operator
+      {{- include "dynamo-operator.labels" . | nindent 8 }}
+    spec:
+      serviceAccountName: {{ include "dynamo-operator.fullname" . }}-crd-conversion-patch
+      restartPolicy: OnFailure
+      {{- with .Values.controllerManager.tolerations }}
+      tolerations:
+        {{- toYaml . | nindent 8 }}
+      {{- end }}
+      {{- with .Values.controllerManager.affinity }}
+      affinity:
+        {{- toYaml . | nindent 8 }}
+      {{- end }}
+      containers:
+      - name: crd-conversion-patch
+        image: {{ .Values.webhook.certGenerator.image.repository }}:{{ .Values.webhook.certGenerator.image.tag }}
+        imagePullPolicy: {{ .Values.webhook.certGenerator.image.pullPolicy }}
+        command:
+        - /bin/bash
+        - -c
+        - |
+          set -e
+
+          echo "📝 Patching DGDR CRD with spec.conversion and cert-manager CA injection annotation..."
+
+          # Set spec.conversion (caBundle left empty — cert-manager ca-injector fills it in
+          # automatically once it sees the cert-manager.io/inject-ca-from annotation below).
+          kubectl patch crd dynamographdeploymentrequests.nvidia.com \
+            --type merge --patch '{
+              "spec": {
+                "conversion": {
+                  "strategy": "Webhook",
+                  "webhook": {
+                    "clientConfig": {
+                      "service": {
+                        "name": "{{ include "dynamo-operator.fullname" . }}-webhook-service",
+                        "namespace": "{{ .Release.Namespace }}",
+                        "path": "/convert"
+                      }
+                    },
+                    "conversionReviewVersions": ["v1"]
+                  }
+                }
+              }
+            }'
+
+          # Add the cert-manager annotation so the ca-injector keeps the caBundle current.
+          kubectl annotate crd dynamographdeploymentrequests.nvidia.com \
+            --overwrite \
+            cert-manager.io/inject-ca-from="{{ .Release.Namespace }}/{{ include "dynamo-operator.fullname" . }}-serving-cert"
+
+          echo "✅ DGDR CRD conversion webhook configured."
+          echo "   cert-manager ca-injector will populate the caBundle automatically."
+        securityContext:
+          allowPrivilegeEscalation: false
+          capabilities:
+            drop:
+            - ALL
+          readOnlyRootFilesystem: true
+          runAsNonRoot: true
+          runAsUser: 1001
+{{- end }}
--- a/deploy/operator/Dockerfile
+++ b/deploy/operator/Dockerfile
@@ -13,8 +13,9 @@ ARG TARGETARCH

 RUN echo "Building for ${TARGETOS}/${TARGETARCH}"

-# Install common dependencies
-RUN apt-get update && apt-get install -y --no-install-recommends git && apt-get clean && rm -rf /var/lib/apt/lists/*
+# Install common dependencies (python3-pip needed for generate-pydantic target).
+# pydantic is constrained to 2.x to match the CI install ("pydantic>=2,<3"):
+# the generated models import model_validator, which only exists in pydantic 2.
+# NOTE(review): CI also installs black==23.1.0 for codegen — confirm whether the
+# generator needs it inside this image as well.
+RUN apt-get update && apt-get install -y --no-install-recommends git python3-pip && apt-get clean && rm -rf /var/lib/apt/lists/* \
+    && pip3 install --no-cache-dir "pydantic>=2,<3" --break-system-packages

 WORKDIR /workspace


--- a/deploy/operator/Makefile
+++ b/deploy/operator/Makefile
@@ -141,9 +141,17 @@ manifests: controller-gen ensure-yq ## Generate WebhookConfiguration, ClusterRol
 	done

 .PHONY: generate
-generate: controller-gen ## Generate code containing DeepCopy, DeepCopyInto, and DeepCopyObject method implementations.
+generate: controller-gen generate-pydantic ## Generate code containing DeepCopy, DeepCopyInto, and DeepCopyObject method implementations.
 	$(CONTROLLER_GEN) object:headerFile="hack/boilerplate.go.txt_" paths="./..."

+# The preflight check requires pydantic 2.x specifically: the generated models
+# use model_validator, so a pydantic 1.x install would pass a bare
+# `import pydantic` probe and only fail later with a less obvious error.
+.PHONY: generate-pydantic
+generate-pydantic: ## Generate Python Pydantic models from v1beta1 Go types (requires Python 3 + pydantic 2.x)
+	@python3 -c "import pydantic, sys; sys.exit(not pydantic.VERSION.startswith('2.'))" 2>/dev/null || { echo "Error: pydantic 2.x not found. Install with: pip install 'pydantic>=2,<3'"; exit 1; }
+	@echo "Generating Pydantic models from v1beta1 DGDR types..."
+	@python3 api/scripts/generate_pydantic_from_go.py
+	@echo "Running Pydantic validation tests..."
+	@python3 api/scripts/test_pydantic_models.py
+
 .PHONY: fmt
 fmt: ## Run go fmt against code.
 	go fmt ./...
@@ -330,6 +338,9 @@ generate-api-docs: crd-ref-docs ## Generate API reference documentation from CRD
 	cat docs/header.md ./docs/api_reference.md docs/footer.md > ../../docs/pages/kubernetes/api-reference.md
 	rm ./docs/api_reference.md
 	@echo "✅ Concatenated header.md, api_reference.md, and footer.md"
+	# Fix duplicate anchors: crd-ref-docs generates identical anchors for same-named types
+	# across API versions; prepend "v1beta1 " to affected v1beta1 headings and links.
+	python3 docs/fix-api-anchors.py ../../docs/pages/kubernetes/api-reference.md

 .PHONY: coverage
 coverage: test

--- a/deploy/operator/PROJECT
+++ b/deploy/operator/PROJECT
@@ -6,7 +6,7 @@ domain: nvidia.com
 layout:
 - go.kubebuilder.io/v4
 projectName: dynamo-kubernetes-operator
-repo: github.com/ai-dynamo/dynamo/deploy/operator/api/v1alpha1
+repo: github.com/ai-dynamo/dynamo/deploy/operator
 resources:
 - api:
    crdVersion: v1

--- a/deploy/operator/api/scripts/generate_pydantic_from_go.py
+++ b/deploy/operator/api/scripts/generate_pydantic_from_go.py
--- a/deploy/operator/api/scripts/test_pydantic_models.py
+++ b/deploy/operator/api/scripts/test_pydantic_models.py
+#!/usr/bin/env python3
+# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""
+Test script for v1beta1 Pydantic models.
+
+Validates that the generated Pydantic models can be imported and used correctly.
+"""
+
+import subprocess
+import sys
+from pathlib import Path
+
+
+def _repo_root() -> Path:
+    start = Path(__file__).parent
+    try:
+        result = subprocess.run(
+            ["git", "rev-parse", "--show-toplevel"],
+            capture_output=True,
+            text=True,
+            check=True,
+            cwd=start,
+        )
+        return Path(result.stdout.strip())
+    except (subprocess.CalledProcessError, FileNotFoundError):
+        pass
+    # Fallback: walk up until we find go.mod (same logic as generate_pydantic_from_go.py)
+    p = start
+    while p != p.parent:
+        if (p / "go.mod").exists():
+            return p
+        p = p.parent
+    return start
+
+
+# Add the components src to path so we can import the generated models
+sys.path.insert(0, str(_repo_root() / "components" / "src"))
+
+import pydantic  # noqa: E402
+
+from dynamo.profiler.utils.dgdr_v1beta1_types import (  # noqa: E402
+    BackendType,
+    DeploymentInfoStatus,
+    DGDRPhase,
+    DynamoGraphDeploymentRequestSpec,
+    DynamoGraphDeploymentRequestStatus,
+    FeaturesSpec,
+    MockerSpec,
+    ModelCacheSpec,
+    OptimizationType,
+    PlannerPreDeploymentSweepMode,
+    PlannerSpec,
+    ProfilingPhase,
+    SearchStrategy,
+    SLASpec,
+    WorkloadSpec,
+)
+
+print("✓ Successfully imported all Pydantic models")
+
+
+def test_simple_dgdr():
+    """Test creating a simple DGDR (minimal spec)"""
+    spec = DynamoGraphDeploymentRequestSpec(
+        model="Qwen/Qwen3-32B",
+    )
+    print("✓ Created simple DGDR spec")
+
+    assert spec.model == "Qwen/Qwen3-32B"
+    assert spec.backend == BackendType.Auto  # kubebuilder:default=auto
+    assert spec.autoApply is True  # kubebuilder:default=true
+    print("✓ Simple DGDR spec validation passed")
+
+
+def test_full_dgdr():
+    """Test creating a full DGDR with all fields"""
+    spec = DynamoGraphDeploymentRequestSpec(
+        model="meta-llama/Llama-3.1-405B",
+        backend=BackendType.Vllm,
+        image="nvcr.io/nvidia/dynamo-runtime:latest",
+        workload=WorkloadSpec(
+            isl=1024,
+            osl=512,
+            concurrency=10.0,
+        ),
+        sla=SLASpec(
+            ttft=100.0,
+            itl=10.0,
+        ),
+        modelCache=ModelCacheSpec(
+            pvcName="model-cache",
+            pvcModelPath="llama-3.1-405b",
+        ),
+        features=FeaturesSpec(
+            planner=PlannerSpec(enabled=True),
+            mocker=MockerSpec(enabled=False),
+        ),
+        searchStrategy=SearchStrategy.Rapid,
+        autoApply=True,
+    )
+    print("✓ Created full DGDR spec")
+
+    assert spec.model == "meta-llama/Llama-3.1-405B"
+    assert spec.backend == BackendType.Vllm
+    assert spec.workload.isl == 1024
+    assert spec.sla.ttft == 100.0
+    assert spec.sla.itl == 10.0
+    assert spec.modelCache.pvcName == "model-cache"
+    assert spec.modelCache.pvcModelPath == "llama-3.1-405b"
+    assert spec.features.planner.enabled is True
+    assert spec.features.mocker.enabled is False
+    print("✓ Full DGDR spec validation passed")
+
+
+def test_sla_defaults_and_validation():
+    """Test SLASpec defaults and mutual-exclusivity validator"""
+    # Default mode: ttft + itl with python-defaults
+    sla = SLASpec()
+    assert sla.ttft == 2000.0
+    assert sla.itl == 30.0
+    assert sla.e2eLatency is None
+    assert sla.optimizationType is None
+    print("✓ SLASpec defaults correct")
+
+    # explicit ttft+itl mode: OK
+    SLASpec(ttft=100.0, itl=10.0)
+
+    # e2eLatency mode: OK (null out ttft/itl)
+    SLASpec(ttft=None, itl=None, e2eLatency=500.0)
+
+    # optimizationType mode: OK (null out ttft/itl)
+    SLASpec(ttft=None, itl=None, optimizationType=OptimizationType.Throughput)
+
+    # mixing modes should raise
+    try:
+        SLASpec(ttft=100.0, itl=10.0, e2eLatency=500.0)
+        raise AssertionError("expected ValidationError for mixed SLA modes")
+    except pydantic.ValidationError:
+        pass
+
+    # ttft without itl should raise
+    try:
+        SLASpec(itl=None, ttft=100.0)
+        raise AssertionError("expected ValidationError for ttft without itl")
+    except pydantic.ValidationError:
+        pass
+
+    print("✓ SLASpec validation correct")
+
+
+def test_workload_defaults():
+    """Test WorkloadSpec kubebuilder defaults"""
+    w = WorkloadSpec()
+    assert w.isl == 4000
+    assert w.osl == 1000
+    print("✓ WorkloadSpec defaults correct")
+
+
+def test_enums():
+    """Test enum values"""
+    # DGDRPhase — TitleCase suffix from Go const names
+    assert DGDRPhase.Pending == "Pending"
+    assert DGDRPhase.Profiling == "Profiling"
+    assert DGDRPhase.Deployed == "Deployed"
+
+    # ProfilingPhase — TitleCase suffix from Go const names
+    assert ProfilingPhase.Initializing == "Initializing"
+    assert ProfilingPhase.SweepingPrefill == "SweepingPrefill"
+
+    # OptimizationType — TitleCase from Go const names
+    assert OptimizationType.Latency == "latency"
+    assert OptimizationType.Throughput == "throughput"
+
+    # SearchStrategy — TitleCase from Go const names
+    assert SearchStrategy.Rapid == "rapid"
+    assert SearchStrategy.Thorough == "thorough"
+
+    # BackendType — mixed case from Go const names
+    assert BackendType.Auto == "auto"
+    assert BackendType.Vllm == "vllm"
+
+    # PlannerPreDeploymentSweepMode (None → None_ to avoid Python keyword clash)
+    assert PlannerPreDeploymentSweepMode.None_ == "none"
+    assert PlannerPreDeploymentSweepMode.Rapid == "rapid"
+
+    print("✓ All enum values validated")
+
+
+def test_status_models():
+    """Test status model creation"""
+    status = DynamoGraphDeploymentRequestStatus(
+        phase=DGDRPhase.Profiling,
+        profilingPhase=ProfilingPhase.SweepingPrefill,
+        dgdName="test-dgd",
+        profilingJobName="test-profiling-job",
+        deploymentInfo=DeploymentInfoStatus(
+            replicas=3,
+            availableReplicas=2,
+        ),
+    )
+    print("✓ Created DGDR status")
+
+    assert status.phase == DGDRPhase.Profiling
+    assert status.profilingPhase == ProfilingPhase.SweepingPrefill
+    assert status.deploymentInfo.replicas == 3
+    print("✓ DGDR status validation passed")
+
+
+def main():
+    """Run all tests"""
+    print("\n" + "=" * 60)
+    print("Testing v1beta1 Pydantic Models")
+    print("=" * 60 + "\n")
+
+    test_simple_dgdr()
+    test_full_dgdr()
+    test_sla_defaults_and_validation()
+    test_workload_defaults()
+    test_enums()
+    test_status_models()
+
+    print("\n" + "=" * 60)
+    print("All tests passed! ✓")
+    print("=" * 60 + "\n")
+
+    return 0
+
+
+if __name__ == "__main__":
+    sys.exit(main())
--- a/deploy/operator/api/v1alpha1/dynamographdeploymentrequest_conversion.go
+++ b/deploy/operator/api/v1alpha1/dynamographdeploymentrequest_conversion.go
--- a/deploy/operator/api/v1alpha1/dynamographdeploymentrequest_conversion_test.go
+++ b/deploy/operator/api/v1alpha1/dynamographdeploymentrequest_conversion_test.go
+/*
+ * SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+ * SPDX-License-Identifier: Apache-2.0
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package v1alpha1
+
+import (
+	"encoding/json"
+	"testing"
+
+	v1beta1 "github.com/ai-dynamo/dynamo/deploy/operator/api/v1beta1"
+	apiextensionsv1 "k8s.io/apiextensions-apiserver/pkg/apis/apiextensions/v1"
+	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
+	runtime "k8s.io/apimachinery/pkg/runtime"
+)
+
+// newV1alpha1DGDR returns a v1alpha1 DGDR test fixture with metadata, spec (including a
+// JSON profiling config blob) and status all populated.
+func newV1alpha1DGDR() *DynamoGraphDeploymentRequest {
+	// Sections of the free-form profiling config blob.
+	slaSection := map[string]interface{}{
+		"ttft": float64(500),
+		"itl":  float64(20),
+		"isl":  float64(2048),
+		"osl":  float64(512),
+	}
+	deploymentSection := map[string]interface{}{
+		"modelCache": map[string]interface{}{
+			"pvcName":        "model-pvc",
+			"modelPathInPvc": "llama-3",
+			"pvcMountPath":   "/data/model",
+		},
+	}
+	// "extra_key" is a key outside the sla/deployment sections.
+	rawConfig, _ := json.Marshal(map[string]interface{}{
+		"sla":        slaSection,
+		"deployment": deploymentSection,
+		"extra_key":  "preserved",
+	})
+
+	gpuDiscovery := true
+
+	fixture := &DynamoGraphDeploymentRequest{}
+	fixture.ObjectMeta = metav1.ObjectMeta{
+		Name:      "test-dgdr",
+		Namespace: "default",
+	}
+	fixture.Spec = DynamoGraphDeploymentRequestSpec{
+		Model:     "meta-llama/Llama-3.1-8B",
+		Backend:   "vllm",
+		AutoApply: true,
+		UseMocker: true,
+		ProfilingConfig: ProfilingConfigSpec{
+			ProfilerImage: "nvcr.io/nvidia/dynamo:latest",
+			OutputPVC:     "output-pvc",
+			Config:        &apiextensionsv1.JSON{Raw: rawConfig},
+			ConfigMapRef:  &ConfigMapKeySelector{Name: "base-config", Key: "disagg.yaml"},
+		},
+		EnableGPUDiscovery: &gpuDiscovery,
+		DeploymentOverrides: &DeploymentOverridesSpec{
+			Name:      "my-dgd",
+			Namespace: "prod",
+			Labels:    map[string]string{"team": "ml"},
+		},
+	}
+	fixture.Status = DynamoGraphDeploymentRequestStatus{
+		State:              DGDRStateProfiling,
+		Backend:            "vllm",
+		ObservedGeneration: 3,
+		ProfilingResults:   "configmap/profiling-cm",
+		Deployment: &DeploymentStatus{
+			Name:      "my-dgd",
+			Namespace: "prod",
+			State:     "initializing",
+			Created:   true,
+		},
+	}
+	return fixture
+}
+
+// newV1beta1DGDR builds a fully-populated v1beta1 DGDR for use in tests.
+func newV1beta1DGDR() *v1beta1.DynamoGraphDeploymentRequest {
+	ttft := float64(300)
+	itl := float64(15)
+	isl := int32(1024)
+	osl := int32(256)
+
+	rawDGD, _ := json.Marshal(map[string]interface{}{"apiVersion": "nvidia.com/v1alpha1", "kind": "DynamoGraphDeployment"})
+
+	return &v1beta1.DynamoGraphDeploymentRequest{
+		ObjectMeta: metav1.ObjectMeta{
+			Name:      "hub-dgdr",
+			Namespace: "default",
+		},
+		Spec: v1beta1.DynamoGraphDeploymentRequestSpec{
+			Model:     "Qwen/Qwen3-32B",
+			Backend:   v1beta1.BackendTypeVllm,
+			AutoApply: false,
+			Image:     "nvcr.io/nvidia/dynamo:0.3.2",
+			SLA: &v1beta1.SLASpec{
+				TTFT: &ttft,
+				ITL:  &itl,
+			},
+			Workload: &v1beta1.WorkloadSpec{
+				ISL: &isl,
+				OSL: &osl,
+			},
+			ModelCache: &v1beta1.ModelCacheSpec{
+				PVCName:      "qwen-pvc",
+				PVCModelPath: "qwen3-32b",
+				PVCMountPath: "/models",
+			},
+			Features: &v1beta1.FeaturesSpec{
+				Mocker: &v1beta1.MockerSpec{Enabled: true},
+			},
+		},
+		Status: v1beta1.DynamoGraphDeploymentRequestStatus{
+			Phase:              v1beta1.DGDRPhaseDeployed,
+			ObservedGeneration: 2,
+			DGDName:            "hub-dgd",
+			ProfilingJobName:   "profiling-job-1",
+			ProfilingResults: &v1beta1.ProfilingResultsStatus{
+				SelectedConfig: &runtime.RawExtension{Raw: rawDGD},
+			},
+		},
+	}
+}
+
+// TestConvertTo_SpecFields verifies that key v1alpha1 spec fields land in the correct v1beta1 locations.
+//
+// The pointer-valued fields (SLA.TTFT, SLA.ITL, Workload.ISL, Workload.OSL) are checked for
+// nil separately from their value, so a failure message shows the converted number instead
+// of a pointer address.
+func TestConvertTo_SpecFields(t *testing.T) {
+	src := newV1alpha1DGDR()
+	dst := &v1beta1.DynamoGraphDeploymentRequest{}
+
+	if err := src.ConvertTo(dst); err != nil {
+		t.Fatalf("ConvertTo() error = %v", err)
+	}
+
+	// Simple 1:1 fields
+	if dst.Spec.Model != src.Spec.Model {
+		t.Errorf("Model: got %q, want %q", dst.Spec.Model, src.Spec.Model)
+	}
+	if string(dst.Spec.Backend) != src.Spec.Backend {
+		t.Errorf("Backend: got %q, want %q", dst.Spec.Backend, src.Spec.Backend)
+	}
+	if dst.Spec.AutoApply != src.Spec.AutoApply {
+		t.Errorf("AutoApply: got %v, want %v", dst.Spec.AutoApply, src.Spec.AutoApply)
+	}
+
+	// ProfilerImage → Image
+	if dst.Spec.Image != src.Spec.ProfilingConfig.ProfilerImage {
+		t.Errorf("Image: got %q, want %q", dst.Spec.Image, src.Spec.ProfilingConfig.ProfilerImage)
+	}
+
+	// UseMocker → Features.Mocker.Enabled
+	if dst.Spec.Features == nil || dst.Spec.Features.Mocker == nil {
+		t.Fatal("Features.Mocker is nil")
+	}
+	if !dst.Spec.Features.Mocker.Enabled {
+		t.Error("Features.Mocker.Enabled: got false, want true")
+	}
+
+	// SLA from JSON blob
+	if dst.Spec.SLA == nil {
+		t.Fatal("SLA is nil")
+	}
+	if got := dst.Spec.SLA.TTFT; got == nil {
+		t.Error("SLA.TTFT: got nil, want 500")
+	} else if *got != 500 {
+		t.Errorf("SLA.TTFT: got %v, want 500", *got)
+	}
+	if got := dst.Spec.SLA.ITL; got == nil {
+		t.Error("SLA.ITL: got nil, want 20")
+	} else if *got != 20 {
+		t.Errorf("SLA.ITL: got %v, want 20", *got)
+	}
+
+	// Workload from JSON blob
+	if dst.Spec.Workload == nil {
+		t.Fatal("Workload is nil")
+	}
+	if got := dst.Spec.Workload.ISL; got == nil {
+		t.Error("Workload.ISL: got nil, want 2048")
+	} else if *got != 2048 {
+		t.Errorf("Workload.ISL: got %d, want 2048", *got)
+	}
+	if got := dst.Spec.Workload.OSL; got == nil {
+		t.Error("Workload.OSL: got nil, want 512")
+	} else if *got != 512 {
+		t.Errorf("Workload.OSL: got %d, want 512", *got)
+	}
+
+	// ModelCache from JSON blob
+	if dst.Spec.ModelCache == nil {
+		t.Fatal("ModelCache is nil")
+	}
+	if dst.Spec.ModelCache.PVCName != "model-pvc" {
+		t.Errorf("ModelCache.PVCName: got %q, want %q", dst.Spec.ModelCache.PVCName, "model-pvc")
+	}
+	if dst.Spec.ModelCache.PVCModelPath != "llama-3" {
+		t.Errorf("ModelCache.PVCModelPath: got %q, want %q", dst.Spec.ModelCache.PVCModelPath, "llama-3")
+	}
+	if dst.Spec.ModelCache.PVCMountPath != "/data/model" {
+		t.Errorf("ModelCache.PVCMountPath: got %q, want %q", dst.Spec.ModelCache.PVCMountPath, "/data/model")
+	}
+
+	// EnableGPUDiscovery → annotation
+	if dst.Annotations[annDGDREnableGPUDisc] != "true" {
+		t.Errorf("annDGDREnableGPUDisc annotation: got %q, want %q", dst.Annotations[annDGDREnableGPUDisc], "true")
+	}
+
+	// OutputPVC → annotation
+	if dst.Annotations[annDGDROutputPVC] != "output-pvc" {
+		t.Errorf("annDGDROutputPVC annotation: got %q, want %q", dst.Annotations[annDGDROutputPVC], "output-pvc")
+	}
+
+	// DeploymentOverrides → annotation (only presence is checked, not the encoded payload)
+	if dst.Annotations[annDGDRDeployOverrides] == "" {
+		t.Error("annDGDRDeployOverrides annotation is empty")
+	}
+}
+
+// TestConvertTo_StatusFields converts the v1alpha1 fixture to v1beta1 and checks where
+// each status field ends up: a typed status field or an annotation.
+func TestConvertTo_StatusFields(t *testing.T) {
+	alpha := newV1alpha1DGDR()
+	hub := &v1beta1.DynamoGraphDeploymentRequest{}
+
+	if err := alpha.ConvertTo(hub); err != nil {
+		t.Fatalf("ConvertTo() error = %v", err)
+	}
+
+	// State "profiling" is expected to surface as the Profiling phase.
+	if got, want := hub.Status.Phase, v1beta1.DGDRPhaseProfiling; got != want {
+		t.Errorf("Status.Phase: got %q, want %q", got, want)
+	}
+	if got := hub.Status.ObservedGeneration; got != 3 {
+		t.Errorf("Status.ObservedGeneration: got %d, want 3", got)
+	}
+
+	// Status.Deployment.Name is carried in DGDName.
+	if got, want := hub.Status.DGDName, "my-dgd"; got != want {
+		t.Errorf("Status.DGDName: got %q, want %q", got, want)
+	}
+
+	// Status.Backend is carried in an annotation.
+	if got, want := hub.Annotations[annDGDRStatusBackend], "vllm"; got != want {
+		t.Errorf("annDGDRStatusBackend annotation: got %q, want %q", got, want)
+	}
+
+	// Status.ProfilingResults (a string in v1alpha1) is carried in an annotation.
+	if got, want := hub.Annotations[annDGDRProfilingResults], "configmap/profiling-cm"; got != want {
+		t.Errorf("annDGDRProfilingResults annotation: got %q, want %q", got, want)
+	}
+}
+
+// TestAlpha1RoundTrip converts the v1alpha1 fixture to the v1beta1 hub and back, then
+// compares the restored object with the fixture field by field.
+func TestAlpha1RoundTrip(t *testing.T) {
+	want := newV1alpha1DGDR()
+
+	// Leg 1: v1alpha1 → v1beta1
+	hub := &v1beta1.DynamoGraphDeploymentRequest{}
+	if err := want.ConvertTo(hub); err != nil {
+		t.Fatalf("ConvertTo() error = %v", err)
+	}
+
+	// Leg 2: v1beta1 → v1alpha1
+	got := &DynamoGraphDeploymentRequest{}
+	if err := got.ConvertFrom(hub); err != nil {
+		t.Fatalf("ConvertFrom() error = %v", err)
+	}
+
+	gotSpec, wantSpec := &got.Spec, &want.Spec
+	gotProf, wantProf := &got.Spec.ProfilingConfig, &want.Spec.ProfilingConfig
+
+	// --- Spec: scalar fields ---
+	if g, w := gotSpec.Model, wantSpec.Model; g != w {
+		t.Errorf("Spec.Model: got %q, want %q", g, w)
+	}
+	if g, w := gotSpec.Backend, wantSpec.Backend; g != w {
+		t.Errorf("Spec.Backend: got %q, want %q", g, w)
+	}
+	if g, w := gotSpec.AutoApply, wantSpec.AutoApply; g != w {
+		t.Errorf("Spec.AutoApply: got %v, want %v", g, w)
+	}
+	if g, w := gotSpec.UseMocker, wantSpec.UseMocker; g != w {
+		t.Errorf("Spec.UseMocker: got %v, want %v", g, w)
+	}
+	if g, w := gotProf.ProfilerImage, wantProf.ProfilerImage; g != w {
+		t.Errorf("ProfilingConfig.ProfilerImage: got %q, want %q", g, w)
+	}
+	if g, w := gotProf.OutputPVC, wantProf.OutputPVC; g != w {
+		t.Errorf("ProfilingConfig.OutputPVC: got %q, want %q", g, w)
+	}
+
+	// --- Spec: ConfigMapRef ---
+	if gotProf.ConfigMapRef == nil {
+		t.Fatal("ProfilingConfig.ConfigMapRef is nil after round-trip")
+	}
+	if g, w := gotProf.ConfigMapRef.Name, wantProf.ConfigMapRef.Name; g != w {
+		t.Errorf("ConfigMapRef.Name: got %q, want %q", g, w)
+	}
+
+	// --- Spec: EnableGPUDiscovery (must come back non-nil and true) ---
+	if flag := gotSpec.EnableGPUDiscovery; flag == nil || !*flag {
+		t.Error("Spec.EnableGPUDiscovery: expected true after round-trip")
+	}
+
+	// --- Spec: DeploymentOverrides ---
+	if gotSpec.DeploymentOverrides == nil {
+		t.Fatal("Spec.DeploymentOverrides is nil after round-trip")
+	}
+	if g, w := gotSpec.DeploymentOverrides.Name, wantSpec.DeploymentOverrides.Name; g != w {
+		t.Errorf("DeploymentOverrides.Name: got %q, want %q", g, w)
+	}
+
+	// --- Spec: profiling config JSON blob ---
+	// The SLA values that were lifted into typed hub fields must reappear in the blob.
+	if gotProf.Config == nil {
+		t.Fatal("ProfilingConfig.Config is nil after round-trip")
+	}
+	var decoded map[string]interface{}
+	if err := json.Unmarshal(gotProf.Config.Raw, &decoded); err != nil {
+		t.Fatalf("failed to unmarshal restored ProfilingConfig.Config: %v", err)
+	}
+	// A missing or non-object "sla" entry leaves slaSection nil.
+	slaSection, _ := decoded["sla"].(map[string]interface{})
+	if slaSection == nil {
+		t.Fatal("sla key missing in restored JSON blob")
+	}
+	// encoding/json decodes JSON numbers into float64 when the target is interface{}.
+	if v := slaSection["ttft"]; v != float64(500) {
+		t.Errorf("blob sla.ttft: got %v, want 500", v)
+	}
+	if v := slaSection["isl"]; v != float64(2048) {
+		t.Errorf("blob sla.isl: got %v, want 2048", v)
+	}
+	// Keys the converter does not model must also survive the round trip.
+	if v := decoded["extra_key"]; v != "preserved" {
+		t.Errorf("extra_key: got %v, want %q", v, "preserved")
+	}
+
+	// --- Status ---
+	gotStatus, wantStatus := &got.Status, &want.Status
+	if g, w := gotStatus.State, wantStatus.State; g != w {
+		t.Errorf("Status.State: got %q, want %q", g, w)
+	}
+	if g, w := gotStatus.ObservedGeneration, wantStatus.ObservedGeneration; g != w {
+		t.Errorf("Status.ObservedGeneration: got %d, want %d", g, w)
+	}
+	if g, w := gotStatus.Backend, wantStatus.Backend; g != w {
+		t.Errorf("Status.Backend: got %q, want %q", g, w)
+	}
+	if g, w := gotStatus.ProfilingResults, wantStatus.ProfilingResults; g != w {
+		t.Errorf("Status.ProfilingResults: got %q, want %q", g, w)
+	}
+	if gotStatus.Deployment == nil {
+		t.Fatal("Status.Deployment is nil after round-trip")
+	}
+	if g, w := gotStatus.Deployment.Name, wantStatus.Deployment.Name; g != w {
+		t.Errorf("Status.Deployment.Name: got %q, want %q", g, w)
+	}
+	if g, w := gotStatus.Deployment.Created, wantStatus.Deployment.Created; g != w {
+		t.Errorf("Status.Deployment.Created: got %v, want %v", g, w)
+	}
+}
+
+// TestHubRoundTrip verifies v1beta1 → v1alpha1 → v1beta1 preserves all round-tripped fields.
+//
+// The pointer-valued fields (SLA.TTFT, SLA.ITL, Workload.ISL, Workload.OSL) are checked for
+// nil separately from their value, so a failure message shows the numbers involved instead
+// of pointer addresses. Status.Phase is the one field expected to change across the round
+// trip (see the status section below).
+func TestHubRoundTrip(t *testing.T) {
+	original := newV1beta1DGDR()
+
+	// Step 1: v1beta1 → v1alpha1
+	spoke := &DynamoGraphDeploymentRequest{}
+	if err := spoke.ConvertFrom(original); err != nil {
+		t.Fatalf("ConvertFrom() error = %v", err)
+	}
+
+	// Step 2: v1alpha1 → v1beta1
+	restored := &v1beta1.DynamoGraphDeploymentRequest{}
+	if err := spoke.ConvertTo(restored); err != nil {
+		t.Fatalf("ConvertTo() error = %v", err)
+	}
+
+	// --- Spec checks ---
+	if restored.Spec.Model != original.Spec.Model {
+		t.Errorf("Spec.Model: got %q, want %q", restored.Spec.Model, original.Spec.Model)
+	}
+	if restored.Spec.Backend != original.Spec.Backend {
+		t.Errorf("Spec.Backend: got %q, want %q", restored.Spec.Backend, original.Spec.Backend)
+	}
+	if restored.Spec.AutoApply != original.Spec.AutoApply {
+		t.Errorf("Spec.AutoApply: got %v, want %v", restored.Spec.AutoApply, original.Spec.AutoApply)
+	}
+	if restored.Spec.Image != original.Spec.Image {
+		t.Errorf("Spec.Image: got %q, want %q", restored.Spec.Image, original.Spec.Image)
+	}
+
+	// UseMocker round-trip via Features.Mocker.Enabled
+	if restored.Spec.Features == nil || restored.Spec.Features.Mocker == nil {
+		t.Fatal("Spec.Features.Mocker is nil after round-trip")
+	}
+	if restored.Spec.Features.Mocker.Enabled != original.Spec.Features.Mocker.Enabled {
+		t.Errorf("Features.Mocker.Enabled: got %v, want %v", restored.Spec.Features.Mocker.Enabled, original.Spec.Features.Mocker.Enabled)
+	}
+
+	// SLA round-trip via JSON blob
+	if restored.Spec.SLA == nil {
+		t.Fatal("Spec.SLA is nil after round-trip")
+	}
+	if got, want := restored.Spec.SLA.TTFT, *original.Spec.SLA.TTFT; got == nil {
+		t.Errorf("SLA.TTFT: got nil, want %v", want)
+	} else if *got != want {
+		t.Errorf("SLA.TTFT: got %v, want %v", *got, want)
+	}
+	if got, want := restored.Spec.SLA.ITL, *original.Spec.SLA.ITL; got == nil {
+		t.Errorf("SLA.ITL: got nil, want %v", want)
+	} else if *got != want {
+		t.Errorf("SLA.ITL: got %v, want %v", *got, want)
+	}
+
+	// Workload round-trip via JSON blob
+	if restored.Spec.Workload == nil {
+		t.Fatal("Spec.Workload is nil after round-trip")
+	}
+	if got, want := restored.Spec.Workload.ISL, *original.Spec.Workload.ISL; got == nil {
+		t.Errorf("Workload.ISL: got nil, want %d", want)
+	} else if *got != want {
+		t.Errorf("Workload.ISL: got %d, want %d", *got, want)
+	}
+	if got, want := restored.Spec.Workload.OSL, *original.Spec.Workload.OSL; got == nil {
+		t.Errorf("Workload.OSL: got nil, want %d", want)
+	} else if *got != want {
+		t.Errorf("Workload.OSL: got %d, want %d", *got, want)
+	}
+
+	// ModelCache round-trip via JSON blob
+	if restored.Spec.ModelCache == nil {
+		t.Fatal("Spec.ModelCache is nil after round-trip")
+	}
+	if restored.Spec.ModelCache.PVCName != original.Spec.ModelCache.PVCName {
+		t.Errorf("ModelCache.PVCName: got %q, want %q", restored.Spec.ModelCache.PVCName, original.Spec.ModelCache.PVCName)
+	}
+	if restored.Spec.ModelCache.PVCModelPath != original.Spec.ModelCache.PVCModelPath {
+		t.Errorf("ModelCache.PVCModelPath: got %q, want %q", restored.Spec.ModelCache.PVCModelPath, original.Spec.ModelCache.PVCModelPath)
+	}
+	if restored.Spec.ModelCache.PVCMountPath != original.Spec.ModelCache.PVCMountPath {
+		t.Errorf("ModelCache.PVCMountPath: got %q, want %q", restored.Spec.ModelCache.PVCMountPath, original.Spec.ModelCache.PVCMountPath)
+	}
+
+	// --- Status checks ---
+	// Phase is intentionally lossy: v1alpha1 has no "Deployed" state, so Deployed is
+	// stored as "Ready" and comes back as Ready rather than the original Deployed.
+	if restored.Status.Phase != v1beta1.DGDRPhaseReady {
+		t.Errorf("Status.Phase: got %q, want %q (Deployed→Ready is lossy)", restored.Status.Phase, v1beta1.DGDRPhaseReady)
+	}
+	if restored.Status.ObservedGeneration != original.Status.ObservedGeneration {
+		t.Errorf("Status.ObservedGeneration: got %d, want %d", restored.Status.ObservedGeneration, original.Status.ObservedGeneration)
+	}
+	// DGDName round-trip
+	if restored.Status.DGDName != original.Status.DGDName {
+		t.Errorf("Status.DGDName: got %q, want %q", restored.Status.DGDName, original.Status.DGDName)
+	}
+	// ProfilingJobName round-trip via annotation
+	if restored.Status.ProfilingJobName != original.Status.ProfilingJobName {
+		t.Errorf("Status.ProfilingJobName: got %q, want %q", restored.Status.ProfilingJobName, original.Status.ProfilingJobName)
+	}
+	// GeneratedDeployment round-trip via ProfilingResults.SelectedConfig
+	// (only presence is asserted here, not the payload bytes)
+	if restored.Status.ProfilingResults == nil || restored.Status.ProfilingResults.SelectedConfig == nil {
+		t.Fatal("Status.ProfilingResults.SelectedConfig is nil after round-trip")
+	}
+}
+
+// TestConvertTo_InvalidProfilingConfigJSON feeds ConvertTo a ProfilingConfig.Config blob
+// that is not valid JSON and requires the conversion to fail instead of returning a
+// partially converted object.
+func TestConvertTo_InvalidProfilingConfigJSON(t *testing.T) {
+	alpha := newV1alpha1DGDR()
+	// Replace the fixture's valid blob with a truncated, unquoted object.
+	malformed := []byte(`{not valid json`)
+	alpha.Spec.ProfilingConfig.Config = &apiextensionsv1.JSON{Raw: malformed}
+
+	hub := &v1beta1.DynamoGraphDeploymentRequest{}
+	if err := alpha.ConvertTo(hub); err == nil {
+		t.Fatal("ConvertTo() expected error for invalid JSON, got nil")
+	}
+}
--- a/deploy/operator/api/v1alpha1/dynamographdeploymentrequest_types.go
+++ b/deploy/operator/api/v1alpha1/dynamographdeploymentrequest_types.go
@@ -273,9 +273,15 @@ type DynamoGraphDeploymentRequestStatus struct {
 // The spec becomes immutable once profiling starts. Users must delete and recreate
 // the DGDR to modify configuration after this point.
 //
+// DEPRECATION NOTICE: v1alpha1 DynamoGraphDeploymentRequest is deprecated.
+// Please migrate to nvidia.com/v1beta1 DynamoGraphDeploymentRequest.
+// v1alpha1 will be removed in a future release.
+//
 // +kubebuilder:object:root=true
 // +kubebuilder:subresource:status
+// +kubebuilder:storageversion
 // +kubebuilder:resource:shortName=dgdr
+// +kubebuilder:deprecatedversion:warning="nvidia.com/v1alpha1 DynamoGraphDeploymentRequest is deprecated; use nvidia.com/v1beta1 DynamoGraphDeploymentRequest"
 // +kubebuilder:printcolumn:name="Model",type=string,JSONPath=`.spec.model`
 // +kubebuilder:printcolumn:name="Backend",type=string,JSONPath=`.status.backend`
 // +kubebuilder:printcolumn:name="State",type=string,JSONPath=`.status.state`

--- a/deploy/operator/api/v1beta1/dynamographdeploymentrequest_conversion.go
+++ b/deploy/operator/api/v1beta1/dynamographdeploymentrequest_conversion.go
+/*
+ * SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+ * SPDX-License-Identifier: Apache-2.0
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package v1beta1
+
+import (
+	"sigs.k8s.io/controller-runtime/pkg/conversion"
+)
+
+// Hub is an intentionally empty marker method that designates v1beta1 as the conversion hub for all DGDR versions.
+// All other versions (v1alpha1, future versions) convert through v1beta1.
+func (*DynamoGraphDeploymentRequest) Hub() {}
+
+// Compile-time assertion: the build fails if *DynamoGraphDeploymentRequest stops satisfying conversion.Hub.
+var _ conversion.Hub = &DynamoGraphDeploymentRequest{}
--- a/deploy/operator/api/v1beta1/dynamographdeploymentrequest_types.go
+++ b/deploy/operator/api/v1beta1/dynamographdeploymentrequest_types.go
--- a/deploy/operator/api/v1beta1/groupversion_info.go
+++ b/deploy/operator/api/v1beta1/groupversion_info.go
+/*
+ * SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+ * SPDX-License-Identifier: Apache-2.0
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+// Package v1beta1 contains API Schema definitions for the nvidia.com v1beta1 API group.
+// +kubebuilder:object:generate=true
+// +groupName=nvidia.com
+package v1beta1
+
+import (
+	"k8s.io/apimachinery/pkg/runtime/schema"
+	"sigs.k8s.io/controller-runtime/pkg/scheme"
+)
+
+var (
+	// GroupVersion is the API group and version (nvidia.com/v1beta1) used to register these objects.
+	GroupVersion = schema.GroupVersion{Group: "nvidia.com", Version: "v1beta1"}
+
+	// SchemeBuilder is the scheme.Builder bound to GroupVersion; it is used to add Go types to the GroupVersionKind scheme.
+	SchemeBuilder = &scheme.Builder{GroupVersion: GroupVersion}
+
+	// AddToScheme adds the types in this group-version to the given scheme.
+	AddToScheme = SchemeBuilder.AddToScheme
+)
--- a/deploy/operator/api/v1beta1/zz_generated.deepcopy.go
+++ b/deploy/operator/api/v1beta1/zz_generated.deepcopy.go
+//go:build !ignore_autogenerated
+
+/*
+SPDX-FileCopyrightText: Copyright (c) 2024-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+SPDX-License-Identifier: Apache-2.0
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+*/
+
+/*
+Copyright 2024.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+*/
+
+// Code generated by controller-gen. DO NOT EDIT.
+
+package v1beta1
+
+import (
+	"k8s.io/api/batch/v1"
+	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
+	"k8s.io/apimachinery/pkg/runtime"
+)
+
+// DeepCopyInto copies the receiver into out (autogenerated deepcopy function); in must be non-nil.
+// Replicas and AvailableReplicas are re-allocated so out does not share those pointers with in.
+func (in *DeploymentInfoStatus) DeepCopyInto(out *DeploymentInfoStatus) {
+	*out = *in
+	if in.Replicas != nil {
+		out.Replicas = new(int32)
+		*out.Replicas = *in.Replicas
+	}
+	if in.AvailableReplicas != nil {
+		out.AvailableReplicas = new(int32)
+		*out.AvailableReplicas = *in.AvailableReplicas
+	}
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new DeploymentInfoStatus.
+func (in *DeploymentInfoStatus) DeepCopy() *DeploymentInfoStatus {
+	if in == nil {
+		return nil
+	}
+	out := new(DeploymentInfoStatus)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto (autogenerated) assigns the struct to out, then deep-copies ObjectMeta, Spec and Status through their own DeepCopyInto methods. in must be non-nil.
+func (in *DynamoGraphDeploymentRequest) DeepCopyInto(out *DynamoGraphDeploymentRequest) {
+	*out = *in
+	out.TypeMeta = in.TypeMeta
+	in.ObjectMeta.DeepCopyInto(&out.ObjectMeta)
+	in.Spec.DeepCopyInto(&out.Spec)
+	in.Status.DeepCopyInto(&out.Status)
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new DynamoGraphDeploymentRequest.
+func (in *DynamoGraphDeploymentRequest) DeepCopy() *DynamoGraphDeploymentRequest {
+	if in == nil {
+		return nil
+	}
+	out := new(DynamoGraphDeploymentRequest)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyObject returns a deep copy of the receiver as a runtime.Object (autogenerated deepcopy function).
+// When the copy is nil, a plain nil is returned instead of a nil pointer wrapped in the interface.
+func (in *DynamoGraphDeploymentRequest) DeepCopyObject() runtime.Object {
+	clone := in.DeepCopy()
+	if clone == nil {
+		return nil
+	}
+	return clone
+}
+
+// DeepCopyInto copies the receiver into out (autogenerated deepcopy function); in must be non-nil.
+// ListMeta is deep-copied and, when Items is non-nil, every element is deep-copied into a new slice.
+func (in *DynamoGraphDeploymentRequestList) DeepCopyInto(out *DynamoGraphDeploymentRequestList) {
+	*out = *in
+	out.TypeMeta = in.TypeMeta
+	in.ListMeta.DeepCopyInto(&out.ListMeta)
+	if in.Items != nil {
+		out.Items = make([]DynamoGraphDeploymentRequest, len(in.Items))
+		for i := range in.Items {
+			in.Items[i].DeepCopyInto(&out.Items[i])
+		}
+	}
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new DynamoGraphDeploymentRequestList.
+func (in *DynamoGraphDeploymentRequestList) DeepCopy() *DynamoGraphDeploymentRequestList {
+	if in == nil {
+		return nil
+	}
+	out := new(DynamoGraphDeploymentRequestList)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyObject returns a deep copy of the receiver as a runtime.Object (autogenerated deepcopy function).
+// When the copy is nil, a plain nil is returned instead of a nil pointer wrapped in the interface.
+func (in *DynamoGraphDeploymentRequestList) DeepCopyObject() runtime.Object {
+	clone := in.DeepCopy()
+	if clone == nil {
+		return nil
+	}
+	return clone
+}
+
+// DeepCopyInto copies the receiver into out (autogenerated deepcopy function); in must be non-nil.
+// Each non-nil pointer field is given a freshly allocated target: ModelCache is copied by value,
+// while Hardware, Workload, SLA, Overrides and Features are copied via their own DeepCopyInto.
+func (in *DynamoGraphDeploymentRequestSpec) DeepCopyInto(out *DynamoGraphDeploymentRequestSpec) {
+	*out = *in
+	if in.ModelCache != nil {
+		out.ModelCache = new(ModelCacheSpec)
+		*out.ModelCache = *in.ModelCache
+	}
+	if in.Hardware != nil {
+		out.Hardware = new(HardwareSpec)
+		in.Hardware.DeepCopyInto(out.Hardware)
+	}
+	if in.Workload != nil {
+		out.Workload = new(WorkloadSpec)
+		in.Workload.DeepCopyInto(out.Workload)
+	}
+	if in.SLA != nil {
+		out.SLA = new(SLASpec)
+		in.SLA.DeepCopyInto(out.SLA)
+	}
+	if in.Overrides != nil {
+		out.Overrides = new(OverridesSpec)
+		in.Overrides.DeepCopyInto(out.Overrides)
+	}
+	if in.Features != nil {
+		out.Features = new(FeaturesSpec)
+		in.Features.DeepCopyInto(out.Features)
+	}
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new DynamoGraphDeploymentRequestSpec.
+func (in *DynamoGraphDeploymentRequestSpec) DeepCopy() *DynamoGraphDeploymentRequestSpec {
+	if in == nil {
+		return nil
+	}
+	out := new(DynamoGraphDeploymentRequestSpec)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto copies the receiver into out (autogenerated deepcopy function); in must be non-nil.
+// Conditions is rebuilt element by element; ProfilingResults and DeploymentInfo are re-allocated
+// and filled through their own DeepCopyInto when set.
+func (in *DynamoGraphDeploymentRequestStatus) DeepCopyInto(out *DynamoGraphDeploymentRequestStatus) {
+	*out = *in
+	if in.Conditions != nil {
+		out.Conditions = make([]metav1.Condition, len(in.Conditions))
+		for i := range in.Conditions {
+			in.Conditions[i].DeepCopyInto(&out.Conditions[i])
+		}
+	}
+	if in.ProfilingResults != nil {
+		out.ProfilingResults = new(ProfilingResultsStatus)
+		in.ProfilingResults.DeepCopyInto(out.ProfilingResults)
+	}
+	if in.DeploymentInfo != nil {
+		out.DeploymentInfo = new(DeploymentInfoStatus)
+		in.DeploymentInfo.DeepCopyInto(out.DeploymentInfo)
+	}
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new DynamoGraphDeploymentRequestStatus.
+func (in *DynamoGraphDeploymentRequestStatus) DeepCopy() *DynamoGraphDeploymentRequestStatus {
+	if in == nil {
+		return nil
+	}
+	out := new(DynamoGraphDeploymentRequestStatus)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto copies the receiver into out (autogenerated deepcopy function); in must be non-nil.
+// Planner is re-allocated and copied via its DeepCopyInto; Mocker is re-allocated and copied by value.
+func (in *FeaturesSpec) DeepCopyInto(out *FeaturesSpec) {
+	*out = *in
+	if in.Planner != nil {
+		out.Planner = new(PlannerSpec)
+		in.Planner.DeepCopyInto(out.Planner)
+	}
+	if in.Mocker != nil {
+		out.Mocker = new(MockerSpec)
+		*out.Mocker = *in.Mocker
+	}
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new FeaturesSpec.
+func (in *FeaturesSpec) DeepCopy() *FeaturesSpec {
+	if in == nil {
+		return nil
+	}
+	out := new(FeaturesSpec)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto copies the receiver into out (autogenerated deepcopy function); in must be non-nil.
+// VRAMMB, TotalGPUs and NumGPUsPerNode are re-allocated so out does not share those pointers with in.
+func (in *HardwareSpec) DeepCopyInto(out *HardwareSpec) {
+	*out = *in
+	if in.VRAMMB != nil {
+		out.VRAMMB = new(float64)
+		*out.VRAMMB = *in.VRAMMB
+	}
+	if in.TotalGPUs != nil {
+		out.TotalGPUs = new(int32)
+		*out.TotalGPUs = *in.TotalGPUs
+	}
+	if in.NumGPUsPerNode != nil {
+		out.NumGPUsPerNode = new(int32)
+		*out.NumGPUsPerNode = *in.NumGPUsPerNode
+	}
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new HardwareSpec.
+func (in *HardwareSpec) DeepCopy() *HardwareSpec {
+	if in == nil {
+		return nil
+	}
+	out := new(HardwareSpec)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto (autogenerated) copies the receiver into out; the body is a single struct assignment. in must be non-nil.
+func (in *KVRouterSpec) DeepCopyInto(out *KVRouterSpec) {
+	*out = *in
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new KVRouterSpec.
+func (in *KVRouterSpec) DeepCopy() *KVRouterSpec {
+	if in == nil {
+		return nil
+	}
+	out := new(KVRouterSpec)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto (autogenerated) copies the receiver into out; the body is a single struct assignment. in must be non-nil.
+func (in *MockerSpec) DeepCopyInto(out *MockerSpec) {
+	*out = *in
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new MockerSpec.
+func (in *MockerSpec) DeepCopy() *MockerSpec {
+	if in == nil {
+		return nil
+	}
+	out := new(MockerSpec)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto (autogenerated) copies the receiver into out; the body is a single struct assignment. in must be non-nil.
+func (in *ModelCacheSpec) DeepCopyInto(out *ModelCacheSpec) {
+	*out = *in
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new ModelCacheSpec.
+func (in *ModelCacheSpec) DeepCopy() *ModelCacheSpec {
+	if in == nil {
+		return nil
+	}
+	out := new(ModelCacheSpec)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto copies the receiver into out (autogenerated deepcopy function); in must be non-nil.
+// ProfilingJob and DGD are re-allocated and filled through their own DeepCopyInto when set.
+func (in *OverridesSpec) DeepCopyInto(out *OverridesSpec) {
+	*out = *in
+	if in.ProfilingJob != nil {
+		out.ProfilingJob = new(v1.JobSpec)
+		in.ProfilingJob.DeepCopyInto(out.ProfilingJob)
+	}
+	if in.DGD != nil {
+		out.DGD = new(runtime.RawExtension)
+		in.DGD.DeepCopyInto(out.DGD)
+	}
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new OverridesSpec.
+func (in *OverridesSpec) DeepCopy() *OverridesSpec {
+	if in == nil {
+		return nil
+	}
+	out := new(OverridesSpec)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto (autogenerated) assigns the struct to out, then deep-copies Config via its own DeepCopyInto. in must be non-nil.
+func (in *ParetoConfig) DeepCopyInto(out *ParetoConfig) {
+	*out = *in
+	in.Config.DeepCopyInto(&out.Config)
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new ParetoConfig.
+func (in *ParetoConfig) DeepCopy() *ParetoConfig {
+	if in == nil {
+		return nil
+	}
+	out := new(ParetoConfig)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto copies the receiver into out (autogenerated deepcopy function); in must be non-nil.
+// PlannerPreDeploymentSweeping is re-allocated and PlannerArgsList is copied into a new slice,
+// so out shares neither with in.
+func (in *PlannerSpec) DeepCopyInto(out *PlannerSpec) {
+	*out = *in
+	if in.PlannerPreDeploymentSweeping != nil {
+		out.PlannerPreDeploymentSweeping = new(PlannerPreDeploymentSweepMode)
+		*out.PlannerPreDeploymentSweeping = *in.PlannerPreDeploymentSweeping
+	}
+	if in.PlannerArgsList != nil {
+		out.PlannerArgsList = make([]string, len(in.PlannerArgsList))
+		copy(out.PlannerArgsList, in.PlannerArgsList)
+	}
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new PlannerSpec.
+func (in *PlannerSpec) DeepCopy() *PlannerSpec {
+	if in == nil {
+		return nil
+	}
+	out := new(PlannerSpec)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto copies the receiver into out (autogenerated deepcopy function); in must be non-nil.
+// Pareto is rebuilt element by element; SelectedConfig is re-allocated and filled through its
+// own DeepCopyInto when set.
+func (in *ProfilingResultsStatus) DeepCopyInto(out *ProfilingResultsStatus) {
+	*out = *in
+	if in.Pareto != nil {
+		out.Pareto = make([]ParetoConfig, len(in.Pareto))
+		for i := range in.Pareto {
+			in.Pareto[i].DeepCopyInto(&out.Pareto[i])
+		}
+	}
+	if in.SelectedConfig != nil {
+		out.SelectedConfig = new(runtime.RawExtension)
+		in.SelectedConfig.DeepCopyInto(out.SelectedConfig)
+	}
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new ProfilingResultsStatus.
+func (in *ProfilingResultsStatus) DeepCopy() *ProfilingResultsStatus {
+	if in == nil {
+		return nil
+	}
+	out := new(ProfilingResultsStatus)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto copies the receiver into out (autogenerated deepcopy function); in must be non-nil.
+// TTFT, ITL and E2ELatency are re-allocated so out does not share those pointers with in.
+func (in *SLASpec) DeepCopyInto(out *SLASpec) {
+	*out = *in
+	if in.TTFT != nil {
+		out.TTFT = new(float64)
+		*out.TTFT = *in.TTFT
+	}
+	if in.ITL != nil {
+		out.ITL = new(float64)
+		*out.ITL = *in.ITL
+	}
+	if in.E2ELatency != nil {
+		out.E2ELatency = new(float64)
+		*out.E2ELatency = *in.E2ELatency
+	}
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new SLASpec.
+func (in *SLASpec) DeepCopy() *SLASpec {
+	if in == nil {
+		return nil
+	}
+	out := new(SLASpec)
+	in.DeepCopyInto(out)
+	return out
+}
+
+// DeepCopyInto copies the receiver into out (autogenerated deepcopy function); in must be non-nil.
+// ISL, OSL, Concurrency and RequestRate are re-allocated so out does not share those pointers with in.
+func (in *WorkloadSpec) DeepCopyInto(out *WorkloadSpec) {
+	*out = *in
+	if in.ISL != nil {
+		out.ISL = new(int32)
+		*out.ISL = *in.ISL
+	}
+	if in.OSL != nil {
+		out.OSL = new(int32)
+		*out.OSL = *in.OSL
+	}
+	if in.Concurrency != nil {
+		out.Concurrency = new(float64)
+		*out.Concurrency = *in.Concurrency
+	}
+	if in.RequestRate != nil {
+		out.RequestRate = new(float64)
+		*out.RequestRate = *in.RequestRate
+	}
+}
+
+// DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new WorkloadSpec.
+func (in *WorkloadSpec) DeepCopy() *WorkloadSpec {
+	if in == nil {
+		return nil
+	}
+	out := new(WorkloadSpec)
+	in.DeepCopyInto(out)
+	return out
+}
--- a/deploy/operator/cmd/main.go
+++ b/deploy/operator/cmd/main.go
@@ -56,6 +56,7 @@ import (

 	semver "github.com/Masterminds/semver/v3"
 	nvidiacomv1alpha1 "github.com/ai-dynamo/dynamo/deploy/operator/api/v1alpha1"
+	nvidiacomv1beta1 "github.com/ai-dynamo/dynamo/deploy/operator/api/v1beta1"
 	"github.com/ai-dynamo/dynamo/deploy/operator/internal/consts"
 	"github.com/ai-dynamo/dynamo/deploy/operator/internal/controller"
 	commonController "github.com/ai-dynamo/dynamo/deploy/operator/internal/controller_common"
@@ -123,6 +124,7 @@ func init() {
 	utilruntime.Must(istioclientsetscheme.AddToScheme(scheme))

 	utilruntime.Must(gaiev1.Install(scheme))
+	utilruntime.Must(nvidiacomv1beta1.AddToScheme(scheme))
 	//+kubebuilder:scaffold:scheme
 }

@@ -744,6 +746,13 @@ func main() {
 			os.Exit(1)
 		}

+		if err = ctrl.NewWebhookManagedBy(mgr).
+			For(&nvidiacomv1alpha1.DynamoGraphDeploymentRequest{}).
+			Complete(); err != nil {
+			setupLog.Error(err, "unable to register conversion webhook", "webhook", "DynamoGraphDeploymentRequest-conversion")
+			os.Exit(1)
+		}
+
 		setupLog.Info("Validation webhooks registered successfully")

 		// Register defaulting (mutating) webhook handlers

--- a/deploy/operator/config/crd/bases/nvidia.com_dynamographdeploymentrequests.yaml
+++ b/deploy/operator/config/crd/bases/nvidia.com_dynamographdeploymentrequests.yaml
--- a/deploy/operator/docs/fix-api-anchors.py
+++ b/deploy/operator/docs/fix-api-anchors.py
+# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Post-process api-reference.md to deduplicate anchors between v1alpha1 and v1beta1.
+
+crd-ref-docs generates anchors solely from type names, so types that exist in both
+API versions get identical anchors (e.g. #dynamographdeploymentrequest). In standard
+Markdown renderers the first occurrence wins, meaning v1beta1 links resolve to the
+v1alpha1 section. This script prepends "v1beta1 " to the affected headings in the
+v1beta1 section and updates all intra-section links to match the new anchors.
+"""
+import re
+import sys
+
+if len(sys.argv) != 2:
+    print(f"Usage: {sys.argv[0]} <api-reference.md>", file=sys.stderr)
+    sys.exit(1)
+
+path = sys.argv[1]
+content = open(path).read()
+
+marker = "## nvidia.com/v1beta1"
+idx = content.find(marker)
+if idx == -1:
+    print("Warning: v1beta1 section not found, skipping anchor fix", file=sys.stderr)
+    sys.exit(0)
+
+alpha_part = content[:idx]
+beta_part = content[idx:]
+
+# Types whose names collide between v1alpha1 and v1beta1.
+# Add to this list if future versions introduce additional same-named types.
+duplicate_types = [
+    "DynamoGraphDeploymentRequest",
+    "DynamoGraphDeploymentRequestSpec",
+    "DynamoGraphDeploymentRequestStatus",
+]
+
+for t in duplicate_types:
+    anchor = t.lower()
+    # Rename section headings: #### TypeName → #### v1beta1 TypeName
+    beta_part = re.sub(
+        r"(####\s+)" + re.escape(t) + r"(\s*$)",
+        r"\1v1beta1 " + t + r"\2",
+        beta_part,
+        flags=re.MULTILINE,
+    )
+    # Update markdown links: (#anchor) → (#v1beta1-anchor)
+    beta_part = beta_part.replace(f"(#{anchor})", f"(#v1beta1-{anchor})")
+
+open(path, "w").write(alpha_part + beta_part)
+print(f"✅ Fixed duplicate anchors in {path}")