Commit 678cffb4 authored by Neelay Shah, committed by GitHub
Browse files
parent 6ba39b09
...@@ -17,8 +17,8 @@ Cargo.toml @ryanolson @grahamking @paulhendricks @biswapanda @tmonty12 @guanluo ...@@ -17,8 +17,8 @@ Cargo.toml @ryanolson @grahamking @paulhendricks @biswapanda @tmonty12 @guanluo
/deploy/Kubernetes/ @whoisj @hutm @biswapanda /deploy/Kubernetes/ @whoisj @hutm @biswapanda
# CI/CD # CI/CD
/.github/ @dynemo-ai/Devops @nnshah1 /.github/ @ai-dynamo/Devops @nnshah1
CODEOWNERS @dynemo-ai/Devops @nnshah1 CODEOWNERS @ai-dynamo/Devops @nnshah1
# Legal # Legal
/LICENSE @nv-anants @nvda-mesharma @glos-nv @dmitry-tokarev-nv /LICENSE @nv-anants @nvda-mesharma @glos-nv @dmitry-tokarev-nv
......
dynmo->dynamo dynmo->dynamo
dynemo->dynamo
...@@ -348,37 +348,37 @@ spec: ...@@ -348,37 +348,37 @@ spec:
- -c - -c
env: env:
{{- if gt $parallel_world 1 }} {{- if gt $parallel_world 1 }}
- name: DYNEMO_LLM_PP - name: DYNAMO_LLM_PP
value: {{ $parallel_pipeline }} value: {{ $parallel_pipeline }}
- name: DYNEMO_LLM_TP - name: DYNAMO_LLM_TP
value: {{ $parallel_tensor }} value: {{ $parallel_tensor }}
{{- end }} {{- end }}
- name: DYNEMO_NAME - name: DYNAMO_NAME
value: {{ $component_name | quote }} value: {{ $component_name | quote }}
{{- if gt (len $component_namespace) 0 }} {{- if gt (len $component_namespace) 0 }}
- name: DYNEMO_NAMESPACE - name: DYNAMO_NAMESPACE
value: {{ $component_namespace | quote }} value: {{ $component_namespace | quote }}
{{- end }} {{- end }}
{{- if ne $port_health 8000 }} {{- if ne $port_health 8000 }}
- name: DYNEMO_PORT_HEALTH - name: DYNAMO_PORT_HEALTH
value: {{ $port_health }} value: {{ $port_health }}
{{- end }} {{- end }}
{{- if ne $port_metrics 9347 }} {{- if ne $port_metrics 9347 }}
- name: DYNEMO_PORT_METRICS - name: DYNAMO_PORT_METRICS
value: {{ $port_metrics }} value: {{ $port_metrics }}
{{- end }} {{- end }}
{{- if ne $port_request 9345 }} {{- if ne $port_request 9345 }}
- name: DYNEMO_PORT_REQUEST - name: DYNAMO_PORT_REQUEST
value: {{ $port_request }} value: {{ $port_request }}
{{- end }} {{- end }}
- name: DYNEMO_RP_ETCD_URL - name: DYNAMO_RP_ETCD_URL
value: {{ $request_plane_etcd_url }} value: {{ $request_plane_etcd_url }}
- name: DYNEMO_RP_NATS_URL - name: DYNAMO_RP_NATS_URL
value: {{ $request_plane_nats_url }} value: {{ $request_plane_nats_url }}
- name: DYNEMO_RP_TIMEOUT - name: DYNAMO_RP_TIMEOUT
value: {{ $request_plane_timeout }} value: {{ $request_plane_timeout }}
{{- if gt $worker_count 1 }} {{- if gt $worker_count 1 }}
- name: DYNEMO_WORKER_COUNT - name: DYNAMO_WORKER_COUNT
value: {{ $worker_count }} value: {{ $worker_count }}
{{- end }} {{- end }}
image: {{ $container_image_name }} image: {{ $container_image_name }}
......
...@@ -6,7 +6,7 @@ domain: nvidia.com ...@@ -6,7 +6,7 @@ domain: nvidia.com
layout: layout:
- go.kubebuilder.io/v4 - go.kubebuilder.io/v4
projectName: dynamo-kubernetes-operator projectName: dynamo-kubernetes-operator
repo: github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1 repo: github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1
resources: resources:
- api: - api:
crdVersion: v1 crdVersion: v1
...@@ -14,7 +14,7 @@ resources: ...@@ -14,7 +14,7 @@ resources:
controller: true controller: true
domain: nvidia.com domain: nvidia.com
kind: DynamoNimDeployment kind: DynamoNimDeployment
path: github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1 path: github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1
version: v1alpha1 version: v1alpha1
- api: - api:
crdVersion: v1 crdVersion: v1
...@@ -22,14 +22,14 @@ resources: ...@@ -22,14 +22,14 @@ resources:
controller: true controller: true
domain: nvidia.com domain: nvidia.com
kind: DynamoNimRequest kind: DynamoNimRequest
path: github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1 path: github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1
version: v1alpha1 version: v1alpha1
- api: - api:
crdVersion: v1 crdVersion: v1
namespaced: true namespaced: true
domain: nvidia.com domain: nvidia.com
kind: DynamoNim kind: DynamoNim
path: github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1 path: github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1
version: v1alpha1 version: v1alpha1
- api: - api:
crdVersion: v1 crdVersion: v1
...@@ -37,6 +37,6 @@ resources: ...@@ -37,6 +37,6 @@ resources:
controller: true controller: true
domain: nvidia.com domain: nvidia.com
kind: DynamoDeployment kind: DynamoDeployment
path: github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1 path: github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1
version: v1alpha1 version: v1alpha1
version: "3" version: "3"
...@@ -21,12 +21,12 @@ import ( ...@@ -21,12 +21,12 @@ import (
"context" "context"
"fmt" "fmt"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/modelschemas" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/modelschemas"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/schemasv1" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/schemasv1"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/pkg/dynamo/consts" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/pkg/dynamo/consts"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/pkg/dynamo/reqcli" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/pkg/dynamo/reqcli"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/pkg/dynamo/utils" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/pkg/dynamo/utils"
) )
type DynamoAuthHeaders struct { type DynamoAuthHeaders struct {
......
...@@ -18,7 +18,7 @@ ...@@ -18,7 +18,7 @@
package v1alpha1 package v1alpha1
import ( import (
dynamoCommon "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/common" dynamoCommon "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/common"
corev1 "k8s.io/api/core/v1" corev1 "k8s.io/api/core/v1"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
) )
......
...@@ -18,8 +18,8 @@ ...@@ -18,8 +18,8 @@
package v1alpha1 package v1alpha1
import ( import (
dynamoCommon "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/common" dynamoCommon "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/common"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/modelschemas" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/modelschemas"
corev1 "k8s.io/api/core/v1" corev1 "k8s.io/api/core/v1"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
) )
......
...@@ -21,8 +21,8 @@ limitations under the License. ...@@ -21,8 +21,8 @@ limitations under the License.
package v1alpha1 package v1alpha1
import ( import (
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/common" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/common"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/modelschemas" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/modelschemas"
"k8s.io/api/autoscaling/v2" "k8s.io/api/autoscaling/v2"
corev1 "k8s.io/api/core/v1" corev1 "k8s.io/api/core/v1"
"k8s.io/apimachinery/pkg/apis/meta/v1" "k8s.io/apimachinery/pkg/apis/meta/v1"
......
...@@ -36,9 +36,9 @@ import ( ...@@ -36,9 +36,9 @@ import (
metricsserver "sigs.k8s.io/controller-runtime/pkg/metrics/server" metricsserver "sigs.k8s.io/controller-runtime/pkg/metrics/server"
"sigs.k8s.io/controller-runtime/pkg/webhook" "sigs.k8s.io/controller-runtime/pkg/webhook"
nvidiacomv1alpha1 "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1" nvidiacomv1alpha1 "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/internal/controller" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/internal/controller"
commonController "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/internal/controller_common" commonController "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/internal/controller_common"
istioclientsetscheme "istio.io/client-go/pkg/clientset/versioned/scheme" istioclientsetscheme "istio.io/client-go/pkg/clientset/versioned/scheme"
//+kubebuilder:scaffold:imports //+kubebuilder:scaffold:imports
) )
......
module github.com/dynemo-ai/dynemo/deploy/dynamo/operator module github.com/ai-dynamo/dynamo/deploy/dynamo/operator
go 1.23.0 go 1.23.0
......
...@@ -20,7 +20,7 @@ package controller ...@@ -20,7 +20,7 @@ package controller
import ( import (
"strings" "strings"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1"
corev1 "k8s.io/api/core/v1" corev1 "k8s.io/api/core/v1"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
) )
......
...@@ -34,9 +34,9 @@ import ( ...@@ -34,9 +34,9 @@ import (
"sigs.k8s.io/controller-runtime/pkg/log" "sigs.k8s.io/controller-runtime/pkg/log"
"sigs.k8s.io/controller-runtime/pkg/predicate" "sigs.k8s.io/controller-runtime/pkg/predicate"
nvidiacomv1alpha1 "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1" nvidiacomv1alpha1 "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1"
commonController "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/internal/controller_common" commonController "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/internal/controller_common"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/internal/nim" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/internal/nim"
) )
const ( const (
......
...@@ -36,16 +36,16 @@ import ( ...@@ -36,16 +36,16 @@ import (
"emperror.dev/errors" "emperror.dev/errors"
"github.com/cisco-open/k8s-objectmatcher/patch" "github.com/cisco-open/k8s-objectmatcher/patch"
dynamoCommon "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/common" dynamoCommon "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/common"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/modelschemas" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/modelschemas"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/schemasv1" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/schemasv1"
yataiclient "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/yatai-client" yataiclient "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/yatai-client"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/internal/controller_common" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/internal/controller_common"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/internal/envoy" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/internal/envoy"
commonconfig "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/pkg/dynamo/config" commonconfig "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/pkg/dynamo/config"
commonconsts "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/pkg/dynamo/consts" commonconsts "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/pkg/dynamo/consts"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/pkg/dynamo/system" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/pkg/dynamo/system"
"github.com/huandu/xstrings" "github.com/huandu/xstrings"
"github.com/jinzhu/copier" "github.com/jinzhu/copier"
"github.com/prometheus/common/version" "github.com/prometheus/common/version"
...@@ -70,7 +70,7 @@ import ( ...@@ -70,7 +70,7 @@ import (
"sigs.k8s.io/controller-runtime/pkg/predicate" "sigs.k8s.io/controller-runtime/pkg/predicate"
"sigs.k8s.io/controller-runtime/pkg/reconcile" "sigs.k8s.io/controller-runtime/pkg/reconcile"
compounadaiConversion "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/conversion" compounadaiConversion "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/conversion"
) )
const ( const (
......
...@@ -35,9 +35,9 @@ import ( ...@@ -35,9 +35,9 @@ import (
"emperror.dev/errors" "emperror.dev/errors"
"github.com/apparentlymart/go-shquot/shquot" "github.com/apparentlymart/go-shquot/shquot"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/internal/controller_common" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/internal/controller_common"
commonconfig "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/pkg/dynamo/config" commonconfig "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/pkg/dynamo/config"
commonconsts "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/pkg/dynamo/consts" commonconsts "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/pkg/dynamo/consts"
"github.com/ettle/strcase" "github.com/ettle/strcase"
"github.com/huandu/xstrings" "github.com/huandu/xstrings"
"github.com/mitchellh/hashstructure/v2" "github.com/mitchellh/hashstructure/v2"
...@@ -63,11 +63,11 @@ import ( ...@@ -63,11 +63,11 @@ import (
"sigs.k8s.io/controller-runtime/pkg/log" "sigs.k8s.io/controller-runtime/pkg/log"
"sigs.k8s.io/controller-runtime/pkg/predicate" "sigs.k8s.io/controller-runtime/pkg/predicate"
dynamoCommon "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/common" dynamoCommon "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/common"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/modelschemas" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/modelschemas"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/schemasv1" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/schemasv1"
yataiclient "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/yatai-client" yataiclient "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/yatai-client"
nvidiacomv1alpha1 "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1" nvidiacomv1alpha1 "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1"
) )
const ( const (
......
...@@ -24,7 +24,7 @@ import ( ...@@ -24,7 +24,7 @@ import (
"runtime" "runtime"
"testing" "testing"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1"
. "github.com/onsi/ginkgo/v2" . "github.com/onsi/ginkgo/v2"
. "github.com/onsi/gomega" . "github.com/onsi/gomega"
monitoringv1 "github.com/prometheus-operator/prometheus-operator/pkg/apis/monitoring/v1" monitoringv1 "github.com/prometheus-operator/prometheus-operator/pkg/apis/monitoring/v1"
......
...@@ -26,20 +26,20 @@ import ( ...@@ -26,20 +26,20 @@ import (
"strings" "strings"
"emperror.dev/errors" "emperror.dev/errors"
compounaiCommon "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/common" compounaiCommon "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/common"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/modelschemas" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/modelschemas"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/schemasv1" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/schemasv1"
yataiclient "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/yatai-client" yataiclient "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/yatai-client"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1"
commonconfig "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/pkg/dynamo/config" commonconfig "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/pkg/dynamo/config"
commonconsts "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/pkg/dynamo/consts" commonconsts "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/pkg/dynamo/consts"
"github.com/huandu/xstrings" "github.com/huandu/xstrings"
corev1 "k8s.io/api/core/v1" corev1 "k8s.io/api/core/v1"
k8serrors "k8s.io/apimachinery/pkg/api/errors" k8serrors "k8s.io/apimachinery/pkg/api/errors"
"k8s.io/apimachinery/pkg/runtime" "k8s.io/apimachinery/pkg/runtime"
"sigs.k8s.io/controller-runtime/pkg/log" "sigs.k8s.io/controller-runtime/pkg/log"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/internal/archive" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/internal/archive"
"gopkg.in/yaml.v2" "gopkg.in/yaml.v2"
) )
......
...@@ -20,8 +20,8 @@ package nim ...@@ -20,8 +20,8 @@ package nim
import ( import (
"testing" "testing"
compounaiCommon "github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/dynamo/common" compounaiCommon "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/dynamo/common"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/api/v1alpha1" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/api/v1alpha1"
"github.com/onsi/gomega" "github.com/onsi/gomega"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
) )
......
...@@ -25,7 +25,7 @@ import ( ...@@ -25,7 +25,7 @@ import (
. "github.com/onsi/ginkgo/v2" . "github.com/onsi/ginkgo/v2"
. "github.com/onsi/gomega" . "github.com/onsi/gomega"
"github.com/dynemo-ai/dynemo/deploy/dynamo/operator/test/utils" "github.com/ai-dynamo/dynamo/deploy/dynamo/operator/test/utils"
) )
const namespace = "dynamo-kubernetes-operator-system" const namespace = "dynamo-kubernetes-operator-system"
......
...@@ -20,7 +20,7 @@ from bentoml._internal.context import server_context # type: ignore ...@@ -20,7 +20,7 @@ from bentoml._internal.context import server_context # type: ignore
from dynamo.sdk.lib.decorators import async_onstart, dynamo_api, dynamo_endpoint from dynamo.sdk.lib.decorators import async_onstart, dynamo_api, dynamo_endpoint
from dynamo.sdk.lib.dependency import depends from dynamo.sdk.lib.dependency import depends
from dynamo.sdk.lib.image import DYNEMO_IMAGE from dynamo.sdk.lib.image import DYNAMO_IMAGE
from dynamo.sdk.lib.service import service from dynamo.sdk.lib.service import service
dynamo_context: dict[str, Any] = {} dynamo_context: dict[str, Any] = {}
...@@ -32,7 +32,7 @@ __all__ = [ ...@@ -32,7 +32,7 @@ __all__ = [
"dynamo_api", "dynamo_api",
"dynamo_endpoint", "dynamo_endpoint",
"depends", "depends",
"DYNEMO_IMAGE", "DYNAMO_IMAGE",
"service", "service",
"dynamo_context", "dynamo_context",
] ]
...@@ -21,5 +21,5 @@ import bentoml ...@@ -21,5 +21,5 @@ import bentoml
# TODO: the "dynamo:latest-vllm" image will not be available to the image builder in k8s, # TODO: the "dynamo:latest-vllm" image will not be available to the image builder in k8s,
# so we should consider publishing the base image for releases to the public nvcr.io registry. # so we should consider publishing the base image for releases to the public nvcr.io registry.
image_name = os.getenv("DYNEMO_IMAGE", "dynamo:latest-vllm") image_name = os.getenv("DYNAMO_IMAGE", "dynamo:latest-vllm")
DYNEMO_IMAGE = bentoml.images.PythonImage(base_image=image_name) DYNAMO_IMAGE = bentoml.images.PythonImage(base_image=image_name)
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment