diff --git a/.github/configurations/vllm-tensorizer.yml b/.github/configurations/vllm-tensorizer.yml index a46df02..a8c08c1 100644 --- a/.github/configurations/vllm-tensorizer.yml +++ b/.github/configurations/vllm-tensorizer.yml @@ -1,8 +1,8 @@ vllm-commit: - - 'v0.12.0' + - 'v0.15.0' flashinfer-commit: - - 'v0.5.3' + - 'v0.6.1' builder-base-image: - - 'ghcr.io/coreweave/ml-containers/torch:19331b7-nccl-cuda12.9.1-ubuntu22.04-nccl2.29.2-1-torch2.9.1-vision0.24.1-audio2.9.1-abi1' + - 'ghcr.io/coreweave/ml-containers/torch:17ad6db-nccl-cuda12.9.1-ubuntu22.04-nccl2.29.2-1-torch2.10.0-vision0.25.0-audio2.10.0-abi1' final-base-image: - - 'ghcr.io/coreweave/ml-containers/torch:19331b7-nccl-cuda12.9.1-ubuntu22.04-nccl2.29.2-1-torch2.9.1-vision0.24.1-audio2.9.1-abi1' + - 'ghcr.io/coreweave/ml-containers/torch:17ad6db-nccl-cuda12.9.1-ubuntu22.04-nccl2.29.2-1-torch2.10.0-vision0.25.0-audio2.10.0-abi1' diff --git a/vllm-tensorizer/Dockerfile b/vllm-tensorizer/Dockerfile index 69ecbf3..f5f49d4 100644 --- a/vllm-tensorizer/Dockerfile +++ b/vllm-tensorizer/Dockerfile @@ -94,7 +94,7 @@ RUN git clone --filter=tree:0 --no-single-branch --no-checkout \ FROM alpine/git:2.36.3 AS deepgemm-downloader WORKDIR /git -ARG DEEPGEMM_COMMIT='594953acce41793ae00a1233eb516044d604bcb6' +ARG DEEPGEMM_COMMIT='0f5f2662027f0db05d4e3f6a94e56e2d8fc45c51' RUN git clone --filter=tree:0 --no-single-branch --no-checkout \ https://github.com/deepseek-ai/DeepGEMM && \ cd DeepGEMM && \ @@ -107,7 +107,7 @@ FROM builder-base AS vllm-builder RUN --mount=type=bind,from=vllm-downloader,source=/git/vllm,target=/workspace,rw \ . /opt/arch_flags.sh && \ if [ -z "$MAX_JOBS" ]; then unset MAX_JOBS; fi && \ - python3 -m pip install --no-cache-dir py-cpuinfo 'cmake>=3.26.1,<4' && \ + python3 -m pip install --no-cache-dir py-cpuinfo 'cmake>=3.26.1,<4' grpcio-tools && \ if [ -f 'use_existing_torch.py' ]; then \ python3 use_existing_torch.py; \ else \