Skip to content

Commit 68f22ad

Browse files
committed
fix: sglang examples
1 parent b7f2e9e commit 68f22ad

File tree

4 files changed: 6 additions (+6) and 6 deletions (-6).

components/backends/sglang/deploy/agg.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -42,7 +42,7 @@ spec:
42 42   workingDir: /workspace/components/backends/sglang
43 43   command: ["sh", "-c"]
44 44   args:
45    - - "python3 -m dynamo.sglang.utils.clear_namespace --namespace dynamo && python3 -m dynamo.frontend --http-port=8000"
   45 + - "python3 -m dynamo.sglang.utils.clear_namespace --namespace sglang-agg && python3 -m dynamo.frontend --http-port=8000"
46 46   SGLangDecodeWorker:
47 47   envFromSecret: hf-token-secret
48 48   livenessProbe:

components/backends/sglang/deploy/agg_router.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -42,7 +42,7 @@ spec:
42 42   workingDir: /workspace/components/backends/sglang
43 43   command: ["sh", "-c"]
44 44   args:
45    - - "python3 -m dynamo.sglang.utils.clear_namespace --namespace dynamo && dynamo run in=http out=dyn --router-mode kv --http-port=8000"
   45 + - "python3 -m dynamo.sglang.utils.clear_namespace --namespace sglang-agg-router && python3 -m dynamo.frontend --http-port=8000 --router-mode kv"
46 46   SGLangDecodeWorker:
47 47   envFromSecret: hf-token-secret
48 48   livenessProbe:

components/backends/sglang/deploy/disagg.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,7 @@
 4  4   apiVersion: nvidia.com/v1alpha1
 5  5   kind: DynamoGraphDeployment
 6  6   metadata:
 7    - name: sglang-agg
    7 + name: sglang-disagg
 8  8   spec:
 9  9   services:
10 10   Frontend:
@@ -42,7 +42,7 @@ spec:
42 42   workingDir: /workspace/components/backends/sglang
43 43   command: ["sh", "-c"]
44 44   args:
45    - - "python3 -m dynamo.sglang.utils.clear_namespace --namespace dynamo && python3 -m dynamo.frontend --http-port=8000"
   45 + - "python3 -m dynamo.sglang.utils.clear_namespace --namespace sglang-disagg && python3 -m dynamo.frontend --http-port=8000"
46 46   SGLangDecodeWorker:
47 47   envFromSecret: hf-token-secret
48 48   livenessProbe:

components/backends/sglang/launch/disagg_dp_attn.sh

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,7 @@ trap cleanup EXIT INT TERM
15 15   python3 -m dynamo.sglang.utils.clear_namespace --namespace dynamo
16 16
17 17   # run ingress
18    - dynamo run in=http out=dyn --http-port=8000 &
   18 + python3 -m dynamo.frontend --http-port=8000 &
19 19   DYNAMO_PID=$!
20 20
21 21   # run prefill worker
@@ -33,7 +33,7 @@ python3 -m dynamo.sglang.worker \
33 33   PREFILL_PID=$!
34 34
35 35   # run decode worker
36    - CUDA_VISIBLE_DEVICES=2,3 python3 dynamo.sglang.decode_worker \
   36 + CUDA_VISIBLE_DEVICES=2,3 python3 -m dynamo.sglang.decode_worker \
37 37   --model-path silence09/DeepSeek-R1-Small-2layers \
38 38   --served-model-name silence09/DeepSeek-R1-Small-2layers \
39 39   --tp 2 \

0 commit comments

Comments
 (0)