File tree: 4 files changed, +6 -6 lines changed
components/backends/sglang: 4 files changed, +6 -6 lines changed
Original file line number Diff line number Diff line change
4242 workingDir : /workspace/components/backends/sglang
4343 command : ["sh", "-c"]
4444 args :
45- - " python3 -m dynamo.sglang.utils.clear_namespace --namespace dynamo && python3 -m dynamo.frontend --http-port=8000"
45+ - " python3 -m dynamo.sglang.utils.clear_namespace --namespace sglang-agg && python3 -m dynamo.frontend --http-port=8000"
4646 SGLangDecodeWorker :
4747 envFromSecret : hf-token-secret
4848 livenessProbe :
Original file line number Diff line number Diff line change
4242 workingDir : /workspace/components/backends/sglang
4343 command : ["sh", "-c"]
4444 args :
45- - " python3 -m dynamo.sglang.utils.clear_namespace --namespace dynamo && dynamo run in=http out=dyn --router-mode kv --http-port=8000 "
45+ - " python3 -m dynamo.sglang.utils.clear_namespace --namespace sglang-agg-router && python3 -m dynamo.frontend --http-port=8000 --router-mode kv"
4646 SGLangDecodeWorker :
4747 envFromSecret : hf-token-secret
4848 livenessProbe :
Original file line number Diff line number Diff line change
44apiVersion : nvidia.com/v1alpha1
55kind : DynamoGraphDeployment
66metadata :
7- name : sglang-agg
7+ name : sglang-disagg
88spec :
99 services :
1010 Frontend :
4242 workingDir : /workspace/components/backends/sglang
4343 command : ["sh", "-c"]
4444 args :
45- - " python3 -m dynamo.sglang.utils.clear_namespace --namespace dynamo && python3 -m dynamo.frontend --http-port=8000"
45+ - " python3 -m dynamo.sglang.utils.clear_namespace --namespace sglang-disagg && python3 -m dynamo.frontend --http-port=8000"
4646 SGLangDecodeWorker :
4747 envFromSecret : hf-token-secret
4848 livenessProbe :
Original file line number Diff line number Diff line change
@@ -15,7 +15,7 @@ trap cleanup EXIT INT TERM
1515python3 -m dynamo.sglang.utils.clear_namespace --namespace dynamo
1616
1717# run ingress
18- dynamo run in=http out=dyn --http-port=8000 &
18+ python3 -m dynamo.frontend --http-port=8000 &
1919DYNAMO_PID=$!
2020
2121# run prefill worker
@@ -33,7 +33,7 @@ python3 -m dynamo.sglang.worker \
3333PREFILL_PID=$!
3434
3535# run decode worker
36- CUDA_VISIBLE_DEVICES=2,3 python3 dynamo.sglang.decode_worker \
36+ CUDA_VISIBLE_DEVICES=2,3 python3 -m dynamo.sglang.decode_worker \
3737 --model-path silence09/DeepSeek-R1-Small-2layers \
3838 --served-model-name silence09/DeepSeek-R1-Small-2layers \
3939 --tp 2 \
You can’t perform that action at this time.
0 commit comments