# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0

# Default values for dynamo-gaie.
# This is a YAML-formatted file.
# Declare variables to be passed into your templates.

# Name of the DynamoGraphDeployment (DGD) backing this model deployment.
dynamoGraphDeploymentName: "vllm-agg"

# Model naming: the identifier used for routing and the short name used for
# generated resource names.
model:
  # Model name that will be used to route traffic to the dynamo model.
  identifier: "Qwen/Qwen3-0.6B"
  # Short name of the model that will be used to generate the resource names.
  # For example, if the model name is Qwen/Qwen3-0.6B, then shortName should
  # be "qwen".
  shortName: "qwen"