Skip to content

Commit da0c572

Browse files
authored
chore: update sgl version and fix h100 wideep example (#2169)
1 parent 30d4612 commit da0c572

File tree

5 files changed

+12
-23
lines changed

5 files changed

+12
-23
lines changed

README.md

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -176,7 +176,6 @@ uv pip install ai-dynamo[sglang]
176176

177177
Run the backend/worker like this:
178178
```
179-
# Note the '.worker' in the module path for SGLang
180179
python -m dynamo.sglang.worker --help
181180
```
182181

components/backends/sglang/docs/dsr1-wideep-h100.md

Lines changed: 3 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -9,15 +9,13 @@ Dynamo supports SGLang's implementation of wide expert parallelism and large sca
99

1010
## Instructions
1111

12-
1. Build the SGLang DeepEP container.
12+
1. Pull the SGLang container.
1313

1414
```bash
15-
git clone -b v0.4.9.post2 https://github.com/sgl-project/sglang.git
16-
cd sglang/docker
17-
docker build -f Dockerfile -t sgl-widepep .
15+
docker pull lmsysorg/sglang:latest
1816
```
1917

20-
You will now have a `sgl-widepep:latest` image
18+
You can also pull a specific tag from the [lmsysorg/sglang Docker Hub tags page](https://hub.docker.com/r/lmsysorg/sglang/tags).
2119

2220
2. Build the Dynamo container
2321

container/Dockerfile.sglang

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,7 @@ ARG ARCH=amd64
2727
ARG ARCH_ALT=x86_64
2828

2929
# Make sure to update the dependency version in pyproject.toml when updating this
30-
ARG SGLANG_VERSION="0.4.9.post1"
30+
ARG SGLANG_VERSION="0.4.9.post6"
3131

3232
##################################
3333
########## Base Image ############

container/Dockerfile.sglang-wideep

Lines changed: 7 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -13,9 +13,9 @@
1313
# See the License for the specific language governing permissions and
1414
# limitations under the License.
1515

16-
# Note this container is built from a local dockerfile
17-
# Please see instructions in examples/sglang/README.md
18-
FROM sgl-wideep:latest
16+
# This should be pinned to the sglang version that is installed with Dynamo
17+
# in the pyproject.toml
18+
FROM lmsysorg/sglang:v0.4.9.post6-cu126
1919

2020
# Add NIXL build dependencies
2121
RUN apt-get update -y && \
@@ -80,10 +80,7 @@ WORKDIR /sgl-workspace
8080
ENV SGL_FORCE_SHUTDOWN=1
8181

8282
WORKDIR /sgl-workspace
83-
# include flush cache endpoint and server support
84-
# https://github.com/ai-dynamo/dynamo/pull/1769
85-
ARG DYNAMO_COMMIT="bd91dca6141e05bcfbe9bd4dea54cc58b9e37d75"
86-
RUN git clone https://github.com/ai-dynamo/dynamo.git && cd dynamo && git checkout ${DYNAMO_COMMIT}
83+
RUN git clone https://github.com/ai-dynamo/dynamo.git
8784

8885
# install dynamo in editable mode
8986
WORKDIR /sgl-workspace/dynamo
@@ -126,8 +123,6 @@ RUN cargo build --release
126123
RUN cd lib/bindings/python && pip install --break-system-packages -e . && cd ../../..
127124
RUN pip install --break-system-packages -e .
128125

129-
ENV PYTHONPATH=/sgl-workspace/dynamo/components/planner/src:/sgl-workspace/dynamo/examples/sglang:$PYTHONPATH
130-
131126
RUN wget --tries=3 --waitretry=5 https://github.com/nats-io/nats-server/releases/download/v2.10.28/nats-server-v2.10.28-${ARCH}.deb && \
132127
dpkg -i nats-server-v2.10.28-${ARCH}.deb && rm nats-server-v2.10.28-${ARCH}.deb
133128

@@ -168,7 +163,7 @@ ENV PATH=/sgl-workspace/perf_analyzer/build/perf_analyzer/src/perf-analyzer-buil
168163

169164
RUN pip install --break-system-packages genai-perf
170165

171-
COPY examples/sglang/configs/deepseek_r1/wideep/* /sgl-workspace/dynamo/examples/sglang/configs/
172-
COPY examples/sglang/utils/benchmarking/* /sgl-workspace/dynamo/examples/sglang/utils/
166+
# Pin sglang-router to 0.1.5, the latest release at the time of writing: https://pypi.org/project/sglang-router/0.1.5
167+
RUN pip install sglang-router==0.1.5
173168

174-
WORKDIR /sgl-workspace/dynamo/examples/sglang
169+
WORKDIR /sgl-workspace/dynamo/components/backends/sglang

pyproject.toml

Lines changed: 1 addition & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -73,10 +73,7 @@ vllm = [
7373
sglang = [
7474
"uvloop",
7575
"nixl",
76-
"sglang[runtime_common]==0.4.9.post1",
77-
"einops",
78-
"sgl-kernel==0.2.4",
79-
"sentencepiece",
76+
"sglang[all]==0.4.9.post6",
8077
]
8178

8279
llama_cpp = [

0 commit comments

Comments
 (0)