Skip to content

Commit 78ffe3d

Browse files
authored
fix: Adjust frontEnd thresholds (#2288)
1 parent 30f3352 commit 78ffe3d

File tree

8 files changed

+44
-40
lines changed

8 files changed

+44
-40
lines changed

components/backends/sglang/deploy/agg.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -12,10 +12,10 @@ spec:
1212
httpGet:
1313
path: /health
1414
port: 8000
15-
initialDelaySeconds: 60
16-
periodSeconds: 60
17-
timeoutSeconds: 30
18-
failureThreshold: 10
15+
initialDelaySeconds: 20
16+
periodSeconds: 5
17+
timeoutSeconds: 5
18+
failureThreshold: 3
1919
readinessProbe:
2020
exec:
2121
command:

components/backends/sglang/deploy/agg_router.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -12,10 +12,10 @@ spec:
1212
httpGet:
1313
path: /health
1414
port: 8000
15-
initialDelaySeconds: 60
16-
periodSeconds: 60
17-
timeoutSeconds: 30
18-
failureThreshold: 10
15+
initialDelaySeconds: 20
16+
periodSeconds: 5
17+
timeoutSeconds: 5
18+
failureThreshold: 3
1919
readinessProbe:
2020
exec:
2121
command:

components/backends/sglang/deploy/disagg.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -12,10 +12,10 @@ spec:
1212
httpGet:
1313
path: /health
1414
port: 8000
15-
initialDelaySeconds: 60
16-
periodSeconds: 60
17-
timeoutSeconds: 30
18-
failureThreshold: 10
15+
initialDelaySeconds: 20
16+
periodSeconds: 5
17+
timeoutSeconds: 5
18+
failureThreshold: 3
1919
readinessProbe:
2020
exec:
2121
command:

components/backends/vllm/deploy/agg.yaml

Lines changed: 16 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -12,20 +12,20 @@ spec:
1212
httpGet:
1313
path: /health
1414
port: 8000
15-
initialDelaySeconds: 60
16-
periodSeconds: 60
17-
timeoutSeconds: 30
18-
failureThreshold: 10
15+
initialDelaySeconds: 20
16+
periodSeconds: 5
17+
timeoutSeconds: 5
18+
failureThreshold: 3
1919
readinessProbe:
2020
exec:
2121
command:
2222
- /bin/sh
2323
- -c
2424
- 'curl -s http://localhost:8000/health | jq -e ".status == \"healthy\""'
25-
initialDelaySeconds: 60
26-
periodSeconds: 60
27-
timeoutSeconds: 30
28-
failureThreshold: 10
25+
initialDelaySeconds: 10
26+
periodSeconds: 5
27+
timeoutSeconds: 5
28+
failureThreshold: 3
2929
dynamoNamespace: vllm-agg
3030
componentType: main
3131
replicas: 1
@@ -51,15 +51,17 @@ spec:
5151
httpGet:
5252
path: /live
5353
port: 9090
54-
periodSeconds: 5
55-
timeoutSeconds: 30
56-
failureThreshold: 1
54+
initialDelaySeconds: 30
55+
periodSeconds: 10
56+
timeoutSeconds: 5
57+
failureThreshold: 3
5758
readinessProbe:
5859
httpGet:
5960
path: /health
6061
port: 9090
62+
initialDelaySeconds: 30
6163
periodSeconds: 10
62-
timeoutSeconds: 30
64+
timeoutSeconds: 5
6365
failureThreshold: 60
6466
dynamoNamespace: vllm-agg
6567
componentType: worker
@@ -86,7 +88,9 @@ spec:
8688
httpGet:
8789
path: /health
8890
port: 9090
91+
initialDelaySeconds: 10
8992
periodSeconds: 10
93+
timeoutSeconds: 5
9094
failureThreshold: 60
9195
image: nvcr.io/nvidian/nim-llm-dev/vllm-runtime:dep-233.17
9296
workingDir: /workspace/components/backends/vllm

components/backends/vllm/deploy/agg_router.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -12,10 +12,10 @@ spec:
1212
httpGet:
1313
path: /health
1414
port: 8000
15-
initialDelaySeconds: 60
16-
periodSeconds: 60
17-
timeoutSeconds: 30
18-
failureThreshold: 10
15+
initialDelaySeconds: 20
16+
periodSeconds: 5
17+
timeoutSeconds: 5
18+
failureThreshold: 3
1919
readinessProbe:
2020
exec:
2121
command:

components/backends/vllm/deploy/disagg.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -15,10 +15,10 @@ spec:
1515
httpGet:
1616
path: /health
1717
port: 8000
18-
initialDelaySeconds: 60
19-
periodSeconds: 60
20-
timeoutSeconds: 30
21-
failureThreshold: 10
18+
initialDelaySeconds: 20
19+
periodSeconds: 5
20+
timeoutSeconds: 5
21+
failureThreshold: 3
2222
readinessProbe:
2323
exec:
2424
command:

components/backends/vllm/deploy/disagg_planner.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -22,10 +22,10 @@ spec:
2222
httpGet:
2323
path: /health
2424
port: 8000
25-
initialDelaySeconds: 60
26-
periodSeconds: 60
27-
timeoutSeconds: 30
28-
failureThreshold: 10
25+
initialDelaySeconds: 20
26+
periodSeconds: 5
27+
timeoutSeconds: 5
28+
failureThreshold: 3
2929
readinessProbe:
3030
exec:
3131
command:

components/backends/vllm/deploy/disagg_router.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -15,10 +15,10 @@ spec:
1515
httpGet:
1616
path: /health
1717
port: 8000
18-
initialDelaySeconds: 60
19-
periodSeconds: 60
20-
timeoutSeconds: 30
21-
failureThreshold: 10
18+
initialDelaySeconds: 20
19+
periodSeconds: 5
20+
timeoutSeconds: 5
21+
failureThreshold: 3
2222
readinessProbe:
2323
exec:
2424
command:

0 commit comments

Comments
 (0)