"lib/runtime/vscode:/vscode.git/clone" did not exist on "7c25f702917f4199dafc4094e665fe41f4bcfe6c"
Unverified commit af7a41c3, authored by Biswa Panda and committed by GitHub
Browse files

feat: use generic image and use single node for oss-gpt-120b recipe (#3454)

parent ff625465
...@@ -30,12 +30,12 @@ spec: ...@@ -30,12 +30,12 @@ spec:
command: command:
- /bin/sh - /bin/sh
- -c - -c
image: nvcr.io/nvidia/ai-dynamo/tensorrtllm-runtime:0.5.1-rc0.pre3 image: my-registry/trtllm-runtime:my-tag
pvc: pvc:
create: false create: false
mountPoint: /model-store mountPoint: /model-store
name: model-cache name: model-cache
replicas: 18 replicas: 1
TrtllmWorker: TrtllmWorker:
componentType: main componentType: main
dynamoNamespace: gpt-oss-agg dynamoNamespace: gpt-oss-agg
...@@ -69,7 +69,7 @@ spec: ...@@ -69,7 +69,7 @@ spec:
command: command:
- /bin/sh - /bin/sh
- -c - -c
image: nvcr.io/nvidia/ai-dynamo/tensorrtllm-runtime:0.5.1-rc0.pre3 image: my-registry/trtllm-runtime:my-tag
env: env:
- name: TRTLLM_ENABLE_PDL - name: TRTLLM_ENABLE_PDL
value: "1" value: "1"
...@@ -80,7 +80,7 @@ spec: ...@@ -80,7 +80,7 @@ spec:
- name: ENGINE_ARGS - name: ENGINE_ARGS
value: "/opt/dynamo/configs/config.yaml" value: "/opt/dynamo/configs/config.yaml"
- name: MODEL_PATH - name: MODEL_PATH
value: "/model-store/models--openai--gpt-oss-120b/snapshots/b5c939de8f754692c1647ca79fbf85e8c1e70f8a" value: "/model-store/hub/models--openai--gpt-oss-120b/snapshots/b5c939de8f754692c1647ca79fbf85e8c1e70f8a"
volumeMounts: volumeMounts:
- mountPath: /opt/dynamo/configs - mountPath: /opt/dynamo/configs
name: llm-config name: llm-config
...@@ -94,7 +94,7 @@ spec: ...@@ -94,7 +94,7 @@ spec:
create: false create: false
mountPoint: /model-store mountPoint: /model-store
name: model-cache name: model-cache
replicas: 18 replicas: 1
resources: resources:
limits: limits:
gpu: "4" gpu: "4"
......
...@@ -114,7 +114,7 @@ spec: ...@@ -114,7 +114,7 @@ spec:
- name: CONCURRENCY_PER_GPU - name: CONCURRENCY_PER_GPU
value: "900" value: "900"
- name: DEPLOYMENT_GPU_COUNT - name: DEPLOYMENT_GPU_COUNT
value: "72" value: "4"
- name: ISL - name: ISL
value: "128" value: "128"
- name: OSL - name: OSL
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment