Unverified commit cf55e8b8, authored by Hongkuan Zhou, committed by GitHub
Browse files

fix: add subcomponenttype to recipes missing this field (#5301)


Signed-off-by: hongkuanz <hongkuanz@nvidia.com>
parent ec5630ea
...@@ -26,6 +26,7 @@ spec: ...@@ -26,6 +26,7 @@ spec:
decode: decode:
dynamoNamespace: sgl-dsr1-16gpu dynamoNamespace: sgl-dsr1-16gpu
componentType: worker componentType: worker
subComponentType: decode
replicas: 1 replicas: 1
multinode: multinode:
nodeCount: 2 nodeCount: 2
...@@ -71,6 +72,7 @@ spec: ...@@ -71,6 +72,7 @@ spec:
prefill: prefill:
dynamoNamespace: sgl-dsr1-16gpu dynamoNamespace: sgl-dsr1-16gpu
componentType: worker componentType: worker
subComponentType: prefill
replicas: 1 replicas: 1
multinode: multinode:
nodeCount: 2 nodeCount: 2
......
...@@ -26,6 +26,7 @@ spec: ...@@ -26,6 +26,7 @@ spec:
decode: decode:
dynamoNamespace: sgl-dsr1-8gpu dynamoNamespace: sgl-dsr1-8gpu
componentType: worker componentType: worker
subComponentType: decode
replicas: 1 replicas: 1
resources: resources:
limits: limits:
...@@ -68,6 +69,7 @@ spec: ...@@ -68,6 +69,7 @@ spec:
prefill: prefill:
dynamoNamespace: sgl-dsr1-8gpu dynamoNamespace: sgl-dsr1-8gpu
componentType: worker componentType: worker
subComponentType: prefill
replicas: 1 replicas: 1
resources: resources:
limits: limits:
......
...@@ -139,6 +139,7 @@ spec: ...@@ -139,6 +139,7 @@ spec:
prefill: prefill:
dynamoNamespace: trtllm-disagg-multinode dynamoNamespace: trtllm-disagg-multinode
componentType: worker componentType: worker
subComponentType: prefill
replicas: 1 replicas: 1
# NOTE: Prefill uses 1 node (no multinode section = single node) # NOTE: Prefill uses 1 node (no multinode section = single node)
# and contributes to ComputeDomain.numNodes (see above) # and contributes to ComputeDomain.numNodes (see above)
...@@ -196,6 +197,7 @@ spec: ...@@ -196,6 +197,7 @@ spec:
decode: decode:
dynamoNamespace: trtllm-disagg-multinode dynamoNamespace: trtllm-disagg-multinode
componentType: worker componentType: worker
subComponentType: decode
replicas: 1 replicas: 1
volumeMounts: volumeMounts:
- name: model-cache - name: model-cache
......
...@@ -28,6 +28,7 @@ spec: ...@@ -28,6 +28,7 @@ spec:
decode: decode:
dynamoNamespace: vllm-dsr1 dynamoNamespace: vllm-dsr1
componentType: worker componentType: worker
subComponentType: decode
replicas: 1 replicas: 1
multinode: multinode:
nodeCount: 2 nodeCount: 2
...@@ -93,6 +94,7 @@ spec: ...@@ -93,6 +94,7 @@ spec:
prefill: prefill:
dynamoNamespace: vllm-dsr1 dynamoNamespace: vllm-dsr1
componentType: worker componentType: worker
subComponentType: prefill
replicas: 1 replicas: 1
multinode: multinode:
nodeCount: 2 nodeCount: 2
......
...@@ -26,6 +26,7 @@ spec: ...@@ -26,6 +26,7 @@ spec:
replicas: 1 replicas: 1
VllmPrefillWorker: VllmPrefillWorker:
componentType: worker componentType: worker
subComponentType: prefill
dynamoNamespace: llama3-70b-disagg-mn dynamoNamespace: llama3-70b-disagg-mn
envFromSecret: hf-token-secret envFromSecret: hf-token-secret
volumeMounts: volumeMounts:
...@@ -57,6 +58,7 @@ spec: ...@@ -57,6 +58,7 @@ spec:
gpu: "8" gpu: "8"
VllmDecodeWorker: VllmDecodeWorker:
componentType: worker componentType: worker
subComponentType: decode
dynamoNamespace: llama3-70b-disagg-mn dynamoNamespace: llama3-70b-disagg-mn
envFromSecret: hf-token-secret envFromSecret: hf-token-secret
volumeMounts: volumeMounts:
......
...@@ -26,6 +26,7 @@ spec: ...@@ -26,6 +26,7 @@ spec:
replicas: 1 replicas: 1
VllmPrefillWorker: VllmPrefillWorker:
componentType: worker componentType: worker
subComponentType: prefill
dynamoNamespace: llama3-70b-disagg-sn dynamoNamespace: llama3-70b-disagg-sn
envFromSecret: hf-token-secret envFromSecret: hf-token-secret
volumeMounts: volumeMounts:
...@@ -69,6 +70,7 @@ spec: ...@@ -69,6 +70,7 @@ spec:
gpu: "2" gpu: "2"
VllmDecodeWorker: VllmDecodeWorker:
componentType: worker componentType: worker
subComponentType: decode
dynamoNamespace: llama3-70b-disagg-sn dynamoNamespace: llama3-70b-disagg-sn
envFromSecret: hf-token-secret envFromSecret: hf-token-secret
volumeMounts: volumeMounts:
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment