File tree (expand/collapse): 3 files changed, +5 -5 lines changed
components/backends/vllm/deploy (expand/collapse file tree): 3 files changed, +5 -5 lines changed
Original file line number | Diff line number | Diff line change
80 80 image : nvcr.io/nvidian/nim-llm-dev/vllm_v1-runtime:dep-216.4
81 81 workingDir : /workspace/components/backends/vllm
82 82 args :
83- - " python3 components/main.py --model Qwen/Qwen3-0.6B --enforce-eager 2>&1 | tee /tmp/vllm.log"
83+ - " python3 -m dynamo.vllm --model Qwen/Qwen3-0.6B --enforce-eager 2>&1 | tee /tmp/vllm.log"
Original file line number | Diff line number | Diff line change
80 80 image : nvcr.io/nvidian/nim-llm-dev/vllm_v1-runtime:dep-216.4
81 81 workingDir : /workspace/components/backends/vllm
82 82 args :
83- - " python3 components/main.py --model Qwen/Qwen3-0.6B --enforce-eager 2>&1 | tee /tmp/vllm.log"
83+ - " python3 -m dynamo.vllm --model Qwen/Qwen3-0.6B --enforce-eager 2>&1 | tee /tmp/vllm.log"
84 84 VllmPrefillWorker :
85 85 dynamoNamespace : vllm-v1-disagg
86 86 envFromSecret : hf-token-secret
@@ -119,4 +119,4 @@ spec:
119 119 image : nvcr.io/nvidian/nim-llm-dev/vllm_v1-runtime:dep-216.4
120 120 workingDir : /workspace/components/backends/vllm
121 121 args :
122- - " python3 components/main.py --model Qwen/Qwen3-0.6B --enforce-eager --is-prefill-worker 2>&1 | tee /tmp/vllm.log"
122+ - " python3 -m dynamo.vllm --model Qwen/Qwen3-0.6B --enforce-eager --is-prefill-worker 2>&1 | tee /tmp/vllm.log"
Original file line number | Diff line number | Diff line change
80 80 image : nvcr.io/nvidian/nim-llm-dev/vllm_v1-runtime:dep-216.4
81 81 workingDir : /workspace/components/backends/vllm
82 82 args :
83- - " python3 components/main.py --model Qwen/Qwen3-0.6B --enforce-eager 2>&1 | tee /tmp/vllm.log"
83+ - " python3 -m dynamo.vllm --model Qwen/Qwen3-0.6B --enforce-eager 2>&1 | tee /tmp/vllm.log"
84 84 VllmPrefillWorker :
85 85 dynamoNamespace : vllm-v1-disagg-planner
86 86 envFromSecret : hf-token-secret
@@ -119,4 +119,4 @@ spec:
119 119 image : nvcr.io/nvidian/nim-llm-dev/vllm_v1-runtime:dep-216.4
120 120 workingDir : /workspace/components/backends/vllm
121 121 args :
122- - " python3 components/main.py --model Qwen/Qwen3-0.6B --enforce-eager --is-prefill-worker 2>&1 | tee /tmp/vllm.log"
122+ - " python3 -m dynamo.vllm --model Qwen/Qwen3-0.6B --enforce-eager --is-prefill-worker 2>&1 | tee /tmp/vllm.log"
You can’t perform that action at this time.
0 commit comments