Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
28 changes: 17 additions & 11 deletions container/Dockerfile.sglang-wideep
Original file line number Diff line number Diff line change
Expand Up @@ -71,20 +71,11 @@ RUN rm -rf /opt/hpcx/ucx && \

# Put /usr/lib and the UCX libraries ahead of any existing library search path entries.
ENV LD_LIBRARY_PATH="/usr/lib:/usr/local/ucx/lib:${LD_LIBRARY_PATH}"

# NIXL is pinned to 0.2.1 (the commit below) for the time being.
# A fix was merged into SGLang after 0.4.8.post1.
# TODO: measure the perf impact of that change before bumping to an up-to-date NIXL
ARG NIXL_COMMIT="5e4c179ee850d482a83cb2a211e0947e46281060"
RUN git clone https://github.com/ai-dynamo/nixl.git \
    && cd nixl \
    && git checkout ${NIXL_COMMIT} \
    && pip install --break-system-packages . \
        --config-settings=setup-args="-Ducx_path=/usr/local/ucx"
# Git ref of NIXL to build from source; override with --build-arg NIXL_TAG=<ref>.
ARG NIXL_TAG=0.3.1
# Clone NIXL, check out the pinned ref, and pip-install it, passing
# ucx_path=/usr/local/ucx to the build as a setup argument.
# --no-cache-dir keeps pip's download/wheel cache out of this image layer.
RUN git clone https://github.com/ai-dynamo/nixl.git \
    && cd nixl \
    && git checkout "${NIXL_TAG}" \
    && pip install --no-cache-dir --break-system-packages . \
        --config-settings=setup-args="-Ducx_path=/usr/local/ucx"

WORKDIR /sgl-workspace

# Swap the currently installed sglang (pip package and the ./sglang directory)
# for the pinned 0.4.8.post1 release, which solves a TBO issue:
# https://github.com/sgl-project/sglang/issues/7511
# The three steps form one logical operation, so they share a single layer;
# --no-cache-dir keeps pip's cache out of that layer.
RUN pip uninstall --break-system-packages -y sglang \
    && rm -rf sglang \
    && pip install --no-cache-dir --break-system-packages "sglang==0.4.8.post1"

# Permit in-flight requests to be shut down forcefully
ENV SGL_FORCE_SHUTDOWN="1"

Expand Down Expand Up @@ -149,6 +140,21 @@ RUN wget --tries=3 --waitretry=5 https://github.com/etcd-io/etcd/releases/downlo
rm /tmp/etcd.tar.gz
ENV PATH=/usr/local/bin/etcd/:$PATH

# Upstream CMake release that replaces the apt-provided one;
# override with --build-arg CMAKE_VERSION=<x.y.z>.
ARG CMAKE_VERSION=3.31.8
# WORKDIR creates the directory when it does not exist, so no separate mkdir is needed.
WORKDIR /sgl-workspace/cmake_build

# Purge the apt-provided CMake, then fetch the Kitware release matching the
# build machine's architecture and unpack it to ./custom_cmake.
# Everything happens in one layer so the downloaded tarball can be deleted
# without being stored in the image; wget retries match the etcd download above.
RUN apt-get purge -y cmake && \
    CMAKE_PKG="cmake-${CMAKE_VERSION}-linux-$(uname -m)" && \
    wget --tries=3 --waitretry=5 \
        "https://github.com/Kitware/CMake/releases/download/v${CMAKE_VERSION}/${CMAKE_PKG}.tar.gz" && \
    tar -xzf "${CMAKE_PKG}.tar.gz" && \
    mv "${CMAKE_PKG}" custom_cmake && \
    rm "${CMAKE_PKG}.tar.gz"
ENV PATH=/sgl-workspace/cmake_build/custom_cmake/bin:$PATH

# Fail the build unless the cmake on PATH reports the pinned version.
# grep's exit status decides the step, so a missing cmake (empty output) fails too.
RUN cmake --version | grep -F "cmake version ${CMAKE_VERSION}"

# Install perf_analyzer and genai-perf
RUN apt-get update -y && \
apt-get install -y --no-install-recommends \
Expand Down
2 changes: 1 addition & 1 deletion examples/sglang/docs/dsr1-wideep-h100.md
Original file line number Diff line number Diff line change
Expand Up @@ -24,7 +24,7 @@ Dynamo supports SGLang's implementation of wide expert parallelism and large sca
1. Build the SGLang DeepEP container.

```bash
git clone -b v0.4.8.post1 https://github.com/sgl-project/sglang.git
git clone -b v0.4.9.post2 https://github.com/sgl-project/sglang.git
cd sglang/docker
docker build -f Dockerfile -t sgl-widepep .
```
Expand Down
Loading