Unverified commit 8cd94119, authored by Biswa Panda and committed by GitHub
Browse files

feat: add hello world deployment example (#1854)

parent fde25fef
......@@ -31,6 +31,6 @@ Middle:
Backend:
message: "mars"
ServiceArgs:
workers: 2
workers: 1
resources:
cpu: "1"
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
apiVersion: nvidia.com/v1alpha1
kind: DynamoGraphDeployment
metadata:
  name: hello-world
# Hello-world graph: three services (Frontend, Middle, Backend), one replica
# each. All three share the same image, working directory, resource sizing
# and `dynamo serve` flags; only the served component (hello_world:<Name>)
# and the --service-name value differ between them.
spec:
  services:
    # Frontend is the only service that sets componentType.
    # NOTE(review): presumably "main" marks the graph's entry point --
    # confirm against the DynamoGraphDeployment CRD.
    Frontend:
      dynamoNamespace: hello-world
      componentType: main
      replicas: 1
      # Requests and limits are deliberately identical (1 CPU, 2Gi).
      resources:
        requests:
          cpu: "1"
          memory: "2Gi"
        limits:
          cpu: "1"
          memory: "2Gi"
      extraPodSpec:
        mainContainer:
          image: nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.3.1
          # ./config.yaml below is resolved relative to this directory.
          workingDir: /workspace/examples/hello_world
          args:
            - dynamo
            - serve
            - hello_world:Frontend
            - --system-app-port
            # Quoted so the port is passed as a string argument.
            - "5000"
            - --enable-system-app
            - --use-default-health-checks
            - --service-name
            - Frontend
            - -f
            - ./config.yaml
    Middle:
      dynamoNamespace: hello-world
      replicas: 1
      # Same sizing as Frontend: requests equal limits.
      resources:
        requests:
          cpu: "1"
          memory: "2Gi"
        limits:
          cpu: "1"
          memory: "2Gi"
      extraPodSpec:
        mainContainer:
          image: nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.3.1
          workingDir: /workspace/examples/hello_world
          args:
            - dynamo
            - serve
            - hello_world:Middle
            - --system-app-port
            - "5000"
            - --enable-system-app
            - --use-default-health-checks
            - --service-name
            - Middle
            - -f
            - ./config.yaml
    Backend:
      dynamoNamespace: hello-world
      replicas: 1
      # Same sizing as Frontend: requests equal limits.
      resources:
        requests:
          cpu: "1"
          memory: "2Gi"
        limits:
          cpu: "1"
          memory: "2Gi"
      extraPodSpec:
        mainContainer:
          image: nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.3.1
          workingDir: /workspace/examples/hello_world
          args:
            - dynamo
            - serve
            - hello_world:Backend
            - --system-app-port
            - "5000"
            - --enable-system-app
            - --use-default-health-checks
            - --service-name
            - Backend
            - -f
            - ./config.yaml
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment