Unverified Commit 9e2a2cc9 authored by Julien Mancuso's avatar Julien Mancuso Committed by GitHub
Browse files

feat: add epp component (#5611)


Signed-off-by: Julien Mancuso <jmancuso@nvidia.com>
parent 6271a31f
...@@ -92,6 +92,8 @@ type RBACConfig struct { ...@@ -92,6 +92,8 @@ type RBACConfig struct {
PlannerClusterRoleName string PlannerClusterRoleName string
// DGDRProfilingClusterRoleName is the name of the ClusterRole for DGDR profiling jobs (cluster-wide mode only) // DGDRProfilingClusterRoleName is the name of the ClusterRole for DGDR profiling jobs (cluster-wide mode only)
DGDRProfilingClusterRoleName string DGDRProfilingClusterRoleName string
// EPPClusterRoleName is the name of the ClusterRole for EPP (cluster-wide mode only)
EPPClusterRoleName string
} }
type IngressConfig struct { type IngressConfig struct {
...@@ -129,6 +131,12 @@ func DetectKaiSchedulerAvailability(ctx context.Context, mgr ctrl.Manager) bool ...@@ -129,6 +131,12 @@ func DetectKaiSchedulerAvailability(ctx context.Context, mgr ctrl.Manager) bool
return detectAPIGroupAvailability(ctx, mgr, "scheduling.run.ai") return detectAPIGroupAvailability(ctx, mgr, "scheduling.run.ai")
} }
// DetectInferencePoolAvailability reports whether the Gateway API Inference
// Extension is available. It does so by asking detectAPIGroupAvailability
// whether the inference.networking.k8s.io API group is registered.
func DetectInferencePoolAvailability(ctx context.Context, mgr ctrl.Manager) bool {
	// API group whose presence signals that the Inference Extension is available.
	const inferenceAPIGroup = "inference.networking.k8s.io"

	return detectAPIGroupAvailability(ctx, mgr, inferenceAPIGroup)
}
// detectAPIGroupAvailability checks if a specific API group is registered in the cluster // detectAPIGroupAvailability checks if a specific API group is registered in the cluster
func detectAPIGroupAvailability(ctx context.Context, mgr ctrl.Manager, groupName string) bool { func detectAPIGroupAvailability(ctx context.Context, mgr ctrl.Manager, groupName string) bool {
logger := log.FromContext(ctx) logger := log.FromContext(ctx)
......
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
...@@ -8,6 +8,7 @@ metadata: ...@@ -8,6 +8,7 @@ metadata:
spec: spec:
services: services:
Frontend: Frontend:
envFromSecret: hf-token-secret
componentType: frontend componentType: frontend
replicas: 1 replicas: 1
extraPodSpec: extraPodSpec:
......
This diff is collapsed.
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment