Skip to content

Commit b8474e5

Browse files
authored
chore: update cmake and gap installation and sgl in wideep container (#1991)
1 parent 157a3b0 commit b8474e5

File tree

2 files changed

+18
-12
lines changed

2 files changed

+18
-12
lines changed

container/Dockerfile.sglang-wideep

Lines changed: 17 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -71,20 +71,11 @@ RUN rm -rf /opt/hpcx/ucx && \
7171

7272
ENV LD_LIBRARY_PATH=/usr/lib:/usr/local/ucx/lib:$LD_LIBRARY_PATH
7373

74-
# Pinning to NIXL 0.2.1 right now
75-
# There is a fix that was merged into SGLang after 0.4.8.post1
76-
# TODO: Investigate perf hit of that change before we bump to up to date NIXL
77-
ARG NIXL_COMMIT="5e4c179ee850d482a83cb2a211e0947e46281060"
78-
RUN git clone https://github.com/ai-dynamo/nixl.git && cd nixl && git checkout ${NIXL_COMMIT} && pip install --break-system-packages . --config-settings=setup-args="-Ducx_path=/usr/local/ucx"
74+
ARG NIXL_TAG=0.3.1
75+
RUN git clone https://github.com/ai-dynamo/nixl.git && cd nixl && git checkout ${NIXL_TAG} && pip install --break-system-packages . --config-settings=setup-args="-Ducx_path=/usr/local/ucx"
7976

8077
WORKDIR /sgl-workspace
8178

82-
RUN pip uninstall --break-system-packages -y sglang
83-
RUN rm -rf sglang
84-
# Pinning to 0.4.8.post1 for now which solves a TBO issue
85-
# https://github.com/sgl-project/sglang/issues/7511
86-
RUN pip install --break-system-packages "sglang==0.4.8.post1"
87-
8879
# Allow forceful shutdown of inflight requests
8980
ENV SGL_FORCE_SHUTDOWN=1
9081

@@ -149,6 +140,21 @@ RUN wget --tries=3 --waitretry=5 https://github.com/etcd-io/etcd/releases/downlo
149140
rm /tmp/etcd.tar.gz
150141
ENV PATH=/usr/local/bin/etcd/:$PATH
151142

143+
ARG CMAKE_VERSION=3.31.8
144+
RUN mkdir /sgl-workspace/cmake_build
145+
WORKDIR /sgl-workspace/cmake_build
146+
147+
# purge the apt-packaged CMake before installing the pinned release below
148+
RUN apt-get purge -y cmake
149+
# download and unpack the CMake release selected by CMAKE_VERSION for this machine's architecture (uname -m)
150+
RUN wget https://github.com/Kitware/CMake/releases/download/v${CMAKE_VERSION}/cmake-${CMAKE_VERSION}-linux-$(uname -m).tar.gz && \
151+
tar -xvzf cmake-${CMAKE_VERSION}-linux-$(uname -m).tar.gz && \
152+
mv cmake-${CMAKE_VERSION}-linux-$(uname -m) custom_cmake
153+
ENV PATH=/sgl-workspace/cmake_build/custom_cmake/bin:$PATH
154+
155+
# sanity check: should print the version set by CMAKE_VERSION (3.31.8 by default)
156+
RUN cmake --version
157+
152158
# Install perf_analyzer and genai-perf
153159
RUN apt-get update -y && \
154160
apt-get install -y --no-install-recommends \

examples/sglang/docs/dsr1-wideep-h100.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,7 @@ Dynamo supports SGLang's implementation of wide expert parallelism and large sca
2424
1. Build the SGLang DeepEP container.
2525

2626
```bash
27-
git clone -b v0.4.8.post1 https://github.com/sgl-project/sglang.git
27+
git clone -b v0.4.9.post2 https://github.com/sgl-project/sglang.git
2828
cd sglang/docker
2929
docker build -f Dockerfile -t sgl-widepep .
3030
```

0 commit comments

Comments
 (0)