File tree Expand file tree Collapse file tree 8 files changed +44
-40
lines changed Expand file tree Collapse file tree 8 files changed +44
-40
lines changed Original file line number Diff line number Diff line change @@ -12,10 +12,10 @@ spec:
1212 httpGet :
1313 path : /health
1414 port : 8000
15- initialDelaySeconds : 60
16- periodSeconds : 60
17- timeoutSeconds : 30
18- failureThreshold : 10
15+ initialDelaySeconds : 20
16+ periodSeconds : 5
17+ timeoutSeconds : 5
18+ failureThreshold : 3
1919 readinessProbe :
2020 exec :
2121 command :
Original file line number Diff line number Diff line change @@ -12,10 +12,10 @@ spec:
1212 httpGet :
1313 path : /health
1414 port : 8000
15- initialDelaySeconds : 60
16- periodSeconds : 60
17- timeoutSeconds : 30
18- failureThreshold : 10
15+ initialDelaySeconds : 20
16+ periodSeconds : 5
17+ timeoutSeconds : 5
18+ failureThreshold : 3
1919 readinessProbe :
2020 exec :
2121 command :
Original file line number Diff line number Diff line change @@ -12,10 +12,10 @@ spec:
1212 httpGet :
1313 path : /health
1414 port : 8000
15- initialDelaySeconds : 60
16- periodSeconds : 60
17- timeoutSeconds : 30
18- failureThreshold : 10
15+ initialDelaySeconds : 20
16+ periodSeconds : 5
17+ timeoutSeconds : 5
18+ failureThreshold : 3
1919 readinessProbe :
2020 exec :
2121 command :
Original file line number Diff line number Diff line change @@ -12,20 +12,20 @@ spec:
1212 httpGet :
1313 path : /health
1414 port : 8000
15- initialDelaySeconds : 60
16- periodSeconds : 60
17- timeoutSeconds : 30
18- failureThreshold : 10
15+ initialDelaySeconds : 20
16+ periodSeconds : 5
17+ timeoutSeconds : 5
18+ failureThreshold : 3
1919 readinessProbe :
2020 exec :
2121 command :
2222 - /bin/sh
2323 - -c
2424 - ' curl -s http://localhost:8000/health | jq -e ".status == \"healthy\""'
25- initialDelaySeconds : 60
26- periodSeconds : 60
27- timeoutSeconds : 30
28- failureThreshold : 10
25+ initialDelaySeconds : 10
26+ periodSeconds : 5
27+ timeoutSeconds : 5
28+ failureThreshold : 3
2929 dynamoNamespace : vllm-agg
3030 componentType : main
3131 replicas : 1
@@ -51,15 +51,17 @@ spec:
5151 httpGet :
5252 path : /live
5353 port : 9090
54- periodSeconds : 5
55- timeoutSeconds : 30
56- failureThreshold : 1
54+ initialDelaySeconds : 30
55+ periodSeconds : 10
56+ timeoutSeconds : 5
57+ failureThreshold : 3
5758 readinessProbe :
5859 httpGet :
5960 path : /health
6061 port : 9090
62+ initialDelaySeconds : 30
6163 periodSeconds : 10
62- timeoutSeconds : 30
64+ timeoutSeconds : 5
6365 failureThreshold : 60
6466 dynamoNamespace : vllm-agg
6567 componentType : worker
8688 httpGet :
8789 path : /health
8890 port : 9090
91+ initialDelaySeconds : 10
8992 periodSeconds : 10
93+ timeoutSeconds : 5
9094 failureThreshold : 60
9195 image : nvcr.io/nvidian/nim-llm-dev/vllm-runtime:dep-233.17
9296 workingDir : /workspace/components/backends/vllm
Original file line number Diff line number Diff line change @@ -12,10 +12,10 @@ spec:
1212 httpGet :
1313 path : /health
1414 port : 8000
15- initialDelaySeconds : 60
16- periodSeconds : 60
17- timeoutSeconds : 30
18- failureThreshold : 10
15+ initialDelaySeconds : 20
16+ periodSeconds : 5
17+ timeoutSeconds : 5
18+ failureThreshold : 3
1919 readinessProbe :
2020 exec :
2121 command :
Original file line number Diff line number Diff line change @@ -15,10 +15,10 @@ spec:
1515 httpGet :
1616 path : /health
1717 port : 8000
18- initialDelaySeconds : 60
19- periodSeconds : 60
20- timeoutSeconds : 30
21- failureThreshold : 10
18+ initialDelaySeconds : 20
19+ periodSeconds : 5
20+ timeoutSeconds : 5
21+ failureThreshold : 3
2222 readinessProbe :
2323 exec :
2424 command :
Original file line number Diff line number Diff line change @@ -22,10 +22,10 @@ spec:
2222 httpGet :
2323 path : /health
2424 port : 8000
25- initialDelaySeconds : 60
26- periodSeconds : 60
27- timeoutSeconds : 30
28- failureThreshold : 10
25+ initialDelaySeconds : 20
26+ periodSeconds : 5
27+ timeoutSeconds : 5
28+ failureThreshold : 3
2929 readinessProbe :
3030 exec :
3131 command :
Original file line number Diff line number Diff line change @@ -15,10 +15,10 @@ spec:
1515 httpGet :
1616 path : /health
1717 port : 8000
18- initialDelaySeconds : 60
19- periodSeconds : 60
20- timeoutSeconds : 30
21- failureThreshold : 10
18+ initialDelaySeconds : 20
19+ periodSeconds : 5
20+ timeoutSeconds : 5
21+ failureThreshold : 3
2222 readinessProbe :
2323 exec :
2424 command :
You can’t perform that action at this time.
0 commit comments