File tree Expand file tree Collapse file tree 9 files changed +20
-20
lines changed Expand file tree Collapse file tree 9 files changed +20
-20
lines changed Original file line number Diff line number Diff line change @@ -92,7 +92,7 @@ Edit the template to match your environment:
9292
9393``` yaml
9494# Update image registry and tag
95- image : your-registry/sglang-runtime:your-tag
95+ image : my-registry/sglang-runtime:my-tag
9696
9797# Configure your model
9898args :
Original file line number Diff line number Diff line change @@ -141,7 +141,7 @@ Edit the template to match your environment:
141141
142142``` yaml
143143# Update image registry and tag
144- image : your-registry/trtllm-runtime:your-tag
144+ image : my-registry/trtllm-runtime:my-tag
145145
146146# Configure your model and deployment settings
147147args :
Original file line number Diff line number Diff line change 3434 replicas : 1
3535 extraPodSpec :
3636 mainContainer :
37- image : nvcr.io/nvidia/ai-dynamo/tensorrtllm-runtime:0.4.1
37+ image : nvcr.io/nvidia/ai-dynamo/tensorrtllm-runtime:my-tag
3838 TRTLLMWorker :
3939 envFromSecret : hf-token-secret
4040 dynamoNamespace : trtllm-agg
5050 configMap :
5151 name : nvidia-config
5252 mainContainer :
53- image : nvcr.io/nvidia/ai-dynamo/tensorrtllm-runtime:0.4.1
53+ image : nvcr.io/nvidia/ai-dynamo/tensorrtllm-runtime:my-tag
5454 workingDir : /workspace/components/backends/trtllm
5555 # mount the configmap as a volume
5656 volumeMounts :
Original file line number Diff line number Diff line change @@ -116,7 +116,7 @@ Edit the template to match your environment:
116116
117117``` yaml
118118# Update image registry and tag
119- image : your-registry/vllm-runtime:your-tag
119+ image : my-registry/vllm-runtime:my-tag
120120
121121# Configure your model
122122args :
Original file line number Diff line number Diff line change 1313 replicas : 1
1414 extraPodSpec :
1515 mainContainer :
16- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
16+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
1717 VllmDecodeWorker :
1818 envFromSecret : hf-token-secret
1919 dynamoNamespace : vllm-agg
2424 gpu : "1"
2525 extraPodSpec :
2626 mainContainer :
27- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
27+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
2828 workingDir : /workspace/components/backends/vllm
2929 command :
3030 - /bin/sh
Original file line number Diff line number Diff line change 1313 replicas : 1
1414 extraPodSpec :
1515 mainContainer :
16- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
16+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
1717 envs :
1818 - name : DYN_ROUTER_MODE
1919 value : kv
2727 gpu : "1"
2828 extraPodSpec :
2929 mainContainer :
30- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
30+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
3131 workingDir : /workspace/components/backends/vllm
3232 command :
3333 - /bin/sh
Original file line number Diff line number Diff line change 1313 replicas : 1
1414 extraPodSpec :
1515 mainContainer :
16- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
16+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
1717 VllmDecodeWorker :
1818 dynamoNamespace : vllm-disagg
1919 envFromSecret : hf-token-secret
2424 gpu : "1"
2525 extraPodSpec :
2626 mainContainer :
27- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
27+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
2828 workingDir : /workspace/components/backends/vllm
2929 command :
3030 - /bin/sh
4141 gpu : "1"
4242 extraPodSpec :
4343 mainContainer :
44- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
44+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
4545 workingDir : /workspace/components/backends/vllm
4646 command :
4747 - /bin/sh
Original file line number Diff line number Diff line change 2020 replicas : 1
2121 extraPodSpec :
2222 mainContainer :
23- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
23+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
2424 Planner :
2525 dynamoNamespace : vllm-disagg-planner
2626 envFromSecret : hf-token-secret
5151 mountPoint : /data/profiling_results
5252 extraPodSpec :
5353 mainContainer :
54- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
54+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
5555 workingDir : /workspace/components/planner/src/dynamo/planner
5656 command :
5757 - /bin/sh
9191 failureThreshold : 10
9292 extraPodSpec :
9393 mainContainer :
94- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
94+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
9595 workingDir : /workspace/components/backends/vllm
9696 command :
9797 - /bin/sh
@@ -114,7 +114,7 @@ spec:
114114 port : 9090
115115 periodSeconds : 10
116116 failureThreshold : 60
117- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
117+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
118118 workingDir : /workspace/components/backends/vllm
119119 command :
120120 - python3
@@ -139,7 +139,7 @@ spec:
139139 port : 9090
140140 periodSeconds : 10
141141 failureThreshold : 60
142- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
142+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
143143 workingDir : /workspace/components/backends/vllm
144144 command :
145145 - python3
Original file line number Diff line number Diff line change 1313 replicas : 1
1414 extraPodSpec :
1515 mainContainer :
16- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
16+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
1717 envs :
1818 - name : DYN_ROUTER_MODE
1919 value : kv
2727 gpu : "1"
2828 extraPodSpec :
2929 mainContainer :
30- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
30+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
3131 workingDir : /workspace/components/backends/vllm
3232 command :
3333 - /bin/sh
4444 gpu : "1"
4545 extraPodSpec :
4646 mainContainer :
47- image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:0.4.1
47+ image : nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag
4848 workingDir : /workspace/components/backends/vllm
4949 command :
5050 - /bin/sh
You can’t perform that action at this time.
0 commit comments