Unverified Commit 78ffe3d3 authored by atchernych's avatar atchernych Committed by GitHub
Browse files

fix: Adjust frontEnd thresholds (#2288)

parent 30f33524
...@@ -12,10 +12,10 @@ spec: ...@@ -12,10 +12,10 @@ spec:
httpGet: httpGet:
path: /health path: /health
port: 8000 port: 8000
initialDelaySeconds: 60 initialDelaySeconds: 20
periodSeconds: 60 periodSeconds: 5
timeoutSeconds: 30 timeoutSeconds: 5
failureThreshold: 10 failureThreshold: 3
readinessProbe: readinessProbe:
exec: exec:
command: command:
......
...@@ -12,10 +12,10 @@ spec: ...@@ -12,10 +12,10 @@ spec:
httpGet: httpGet:
path: /health path: /health
port: 8000 port: 8000
initialDelaySeconds: 60 initialDelaySeconds: 20
periodSeconds: 60 periodSeconds: 5
timeoutSeconds: 30 timeoutSeconds: 5
failureThreshold: 10 failureThreshold: 3
readinessProbe: readinessProbe:
exec: exec:
command: command:
......
...@@ -12,10 +12,10 @@ spec: ...@@ -12,10 +12,10 @@ spec:
httpGet: httpGet:
path: /health path: /health
port: 8000 port: 8000
initialDelaySeconds: 60 initialDelaySeconds: 20
periodSeconds: 60 periodSeconds: 5
timeoutSeconds: 30 timeoutSeconds: 5
failureThreshold: 10 failureThreshold: 3
readinessProbe: readinessProbe:
exec: exec:
command: command:
......
...@@ -12,20 +12,20 @@ spec: ...@@ -12,20 +12,20 @@ spec:
httpGet: httpGet:
path: /health path: /health
port: 8000 port: 8000
initialDelaySeconds: 60 initialDelaySeconds: 20
periodSeconds: 60 periodSeconds: 5
timeoutSeconds: 30 timeoutSeconds: 5
failureThreshold: 10 failureThreshold: 3
readinessProbe: readinessProbe:
exec: exec:
command: command:
- /bin/sh - /bin/sh
- -c - -c
- 'curl -s http://localhost:8000/health | jq -e ".status == \"healthy\""' - 'curl -s http://localhost:8000/health | jq -e ".status == \"healthy\""'
initialDelaySeconds: 60 initialDelaySeconds: 10
periodSeconds: 60 periodSeconds: 5
timeoutSeconds: 30 timeoutSeconds: 5
failureThreshold: 10 failureThreshold: 3
dynamoNamespace: vllm-agg dynamoNamespace: vllm-agg
componentType: main componentType: main
replicas: 1 replicas: 1
...@@ -51,15 +51,17 @@ spec: ...@@ -51,15 +51,17 @@ spec:
httpGet: httpGet:
path: /live path: /live
port: 9090 port: 9090
periodSeconds: 5 initialDelaySeconds: 30
timeoutSeconds: 30 periodSeconds: 10
failureThreshold: 1 timeoutSeconds: 5
failureThreshold: 3
readinessProbe: readinessProbe:
httpGet: httpGet:
path: /health path: /health
port: 9090 port: 9090
initialDelaySeconds: 30
periodSeconds: 10 periodSeconds: 10
timeoutSeconds: 30 timeoutSeconds: 5
failureThreshold: 60 failureThreshold: 60
dynamoNamespace: vllm-agg dynamoNamespace: vllm-agg
componentType: worker componentType: worker
...@@ -86,7 +88,9 @@ spec: ...@@ -86,7 +88,9 @@ spec:
httpGet: httpGet:
path: /health path: /health
port: 9090 port: 9090
initialDelaySeconds: 10
periodSeconds: 10 periodSeconds: 10
timeoutSeconds: 5
failureThreshold: 60 failureThreshold: 60
image: nvcr.io/nvidian/nim-llm-dev/vllm-runtime:dep-233.17 image: nvcr.io/nvidian/nim-llm-dev/vllm-runtime:dep-233.17
workingDir: /workspace/components/backends/vllm workingDir: /workspace/components/backends/vllm
......
...@@ -12,10 +12,10 @@ spec: ...@@ -12,10 +12,10 @@ spec:
httpGet: httpGet:
path: /health path: /health
port: 8000 port: 8000
initialDelaySeconds: 60 initialDelaySeconds: 20
periodSeconds: 60 periodSeconds: 5
timeoutSeconds: 30 timeoutSeconds: 5
failureThreshold: 10 failureThreshold: 3
readinessProbe: readinessProbe:
exec: exec:
command: command:
......
...@@ -15,10 +15,10 @@ spec: ...@@ -15,10 +15,10 @@ spec:
httpGet: httpGet:
path: /health path: /health
port: 8000 port: 8000
initialDelaySeconds: 60 initialDelaySeconds: 20
periodSeconds: 60 periodSeconds: 5
timeoutSeconds: 30 timeoutSeconds: 5
failureThreshold: 10 failureThreshold: 3
readinessProbe: readinessProbe:
exec: exec:
command: command:
......
...@@ -22,10 +22,10 @@ spec: ...@@ -22,10 +22,10 @@ spec:
httpGet: httpGet:
path: /health path: /health
port: 8000 port: 8000
initialDelaySeconds: 60 initialDelaySeconds: 20
periodSeconds: 60 periodSeconds: 5
timeoutSeconds: 30 timeoutSeconds: 5
failureThreshold: 10 failureThreshold: 3
readinessProbe: readinessProbe:
exec: exec:
command: command:
......
...@@ -15,10 +15,10 @@ spec: ...@@ -15,10 +15,10 @@ spec:
httpGet: httpGet:
path: /health path: /health
port: 8000 port: 8000
initialDelaySeconds: 60 initialDelaySeconds: 20
periodSeconds: 60 periodSeconds: 5
timeoutSeconds: 30 timeoutSeconds: 5
failureThreshold: 10 failureThreshold: 3
readinessProbe: readinessProbe:
exec: exec:
command: command:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment