-
-
Notifications
You must be signed in to change notification settings - Fork 18.6k
python3Packages.vllm: 0.11.0 -> 0.11.2 #463032
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Merged
happysalada
merged 1 commit into
NixOS:master
from
GaetanLepage:update/python3Packages.vllm
Nov 23, 2025
Merged
Changes from all commits
Commits
File filter
Filter by extension
Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
There are no files selected for viewing
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
13 changes: 7 additions & 6 deletions
13
pkgs/development/python-modules/vllm/0003-propagate-pythonpath.patch
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -1,12 +1,13 @@ | ||
| diff --git a/vllm/model_executor/models/registry.py b/vllm/model_executor/models/registry.py | ||
| index 81623def..2a6e2c92 100644 | ||
| index a2de597c8..4c2410209 100644 | ||
| --- a/vllm/model_executor/models/registry.py | ||
| +++ b/vllm/model_executor/models/registry.py | ||
| @@ -521,6 +521,7 @@ def _run_in_subprocess(fn: Callable[[], _T]) -> _T: | ||
| @@ -1121,7 +1121,7 @@ def _run_in_subprocess(fn: Callable[[], _T]) -> _T: | ||
| # cannot use `sys.executable __file__` here because the script | ||
| # contains relative imports | ||
| returned = subprocess.run(_SUBPROCESS_COMMAND, | ||
| input=input_bytes, | ||
| + env={'PYTHONPATH': ':'.join(sys.path)}, | ||
| capture_output=True) | ||
| returned = subprocess.run( | ||
| - _SUBPROCESS_COMMAND, input=input_bytes, capture_output=True | ||
| + _SUBPROCESS_COMMAND, input=input_bytes, capture_output=True, env={'PYTHONPATH': ':'.join(sys.path)}, | ||
| ) | ||
|
|
||
| # check if the subprocess is successful |
4 changes: 2 additions & 2 deletions
4
pkgs/development/python-modules/vllm/0005-drop-intel-reqs.patch
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -34,6 +34,7 @@ | |
| uvicorn, | ||
| pydantic, | ||
| aioprometheus, | ||
| anthropic, | ||
| nvidia-ml-py, | ||
| openai, | ||
| pyzmq, | ||
|
|
@@ -53,6 +54,7 @@ | |
| compressed-tensors, | ||
| mistral-common, | ||
| msgspec, | ||
| model-hosting-container-standards, | ||
| numactl, | ||
| tokenizers, | ||
| oneDNN, | ||
|
|
@@ -98,10 +100,11 @@ let | |
| # see CMakeLists.txt, grepping for CUTLASS_REVISION | ||
| # https://github.com/vllm-project/vllm/blob/v${version}/CMakeLists.txt | ||
| cutlass = fetchFromGitHub { | ||
| name = "cutlass-source"; | ||
| owner = "NVIDIA"; | ||
| repo = "cutlass"; | ||
| tag = "v4.0.0"; | ||
| hash = "sha256-HJY+Go1viPkSVZPEs/NyMtYJzas4mMLiIZF3kNX+WgA="; | ||
| tag = "v4.2.1"; | ||
| hash = "sha256-iP560D5Vwuj6wX1otJhwbvqe/X4mYVeKTpK533Wr5gY="; | ||
| }; | ||
|
|
||
| # FlashMLA's Blackwell (SM100) kernels were developed against CUTLASS v3.9.0 | ||
|
|
@@ -126,10 +129,11 @@ let | |
| # grep for GIT_TAG in the following file | ||
| # https://github.com/vllm-project/vllm/blob/v${version}/cmake/external_projects/flashmla.cmake | ||
| src = fetchFromGitHub { | ||
| name = "FlashMLA-source"; | ||
| owner = "vllm-project"; | ||
| repo = "FlashMLA"; | ||
| rev = "5f65b85703c7ed75fda01e06495077caad207c3f"; | ||
| hash = "sha256-DO9EFNSoAgyfRRc095v1UjT+Zdzk4cFY0+n28FVEwI0="; | ||
| rev = "46d64a8ebef03fa50b4ae74937276a5c940e3f95"; | ||
| hash = "sha256-jtMzWB5hKz8mJGsdK6q4YpQbGp9IrQxbwmB3a64DIl0="; | ||
| }; | ||
|
|
||
| dontConfigure = true; | ||
|
|
@@ -145,6 +149,16 @@ let | |
| ''; | ||
| }; | ||
|
|
||
| # grep for GIT_TAG in the following file | ||
| # https://github.com/vllm-project/vllm/blob/v${version}/cmake/external_projects/qutlass.cmake | ||
| qutlass = fetchFromGitHub { | ||
| name = "qutlass-source"; | ||
| owner = "IST-DASLab"; | ||
| repo = "qutlass"; | ||
| rev = "830d2c4537c7396e14a02a46fbddd18b5d107c65"; | ||
| hash = "sha256-aG4qd0vlwP+8gudfvHwhtXCFmBOJKQQTvcwahpEqC84="; | ||
| }; | ||
|
|
||
| vllm-flash-attn' = lib.defaultTo (stdenv.mkDerivation { | ||
| pname = "vllm-flash-attn"; | ||
| # https://github.com/vllm-project/flash-attention/blob/${src.rev}/vllm_flash_attn/__init__.py | ||
|
|
@@ -153,10 +167,11 @@ let | |
| # grep for GIT_TAG in the following file | ||
| # https://github.com/vllm-project/vllm/blob/v${version}/cmake/external_projects/vllm_flash_attn.cmake | ||
| src = fetchFromGitHub { | ||
| name = "flash-attention-source"; | ||
| owner = "vllm-project"; | ||
| repo = "flash-attention"; | ||
| rev = "ee4d25bd84e0cbc7e0b9b9685085fd5db2dcb62a"; | ||
| hash = "sha256-2r0Habd/kBpvM4/aQFIYyj+uQAa3M9gjk3DcBZHFNfA="; | ||
| rev = "58e0626a692f09241182582659e3bf8f16472659"; | ||
| hash = "sha256-ewdZd7LuBKBV0y3AaGRWISJzjg6cu59D2OtgqoDjrbM="; | ||
| }; | ||
|
|
||
| patches = [ | ||
|
|
@@ -284,7 +299,7 @@ in | |
|
|
||
| buildPythonPackage rec { | ||
| pname = "vllm"; | ||
| version = "0.11.0"; | ||
| version = "0.11.2"; | ||
| pyproject = true; | ||
|
|
||
| stdenv = torch.stdenv; | ||
|
|
@@ -293,38 +308,31 @@ buildPythonPackage rec { | |
| owner = "vllm-project"; | ||
| repo = "vllm"; | ||
| tag = "v${version}"; | ||
| hash = "sha256-47TPvvPQvVbh6Gm2yvi+xhWZ8tSma91rp9hp/SBrEY8="; | ||
| hash = "sha256-DoSlkFmR3KKEtfSfdRB++0CZeeXgxmM3zZjONlxbe8U="; | ||
| }; | ||
|
|
||
| patches = [ | ||
| ./0002-setup.py-nix-support-respect-cmakeFlags.patch | ||
| ./0003-propagate-pythonpath.patch | ||
| ./0005-drop-intel-reqs.patch | ||
| # TODO: Remove the below patches when included in vLLM release | ||
| (fetchpatch { | ||
| url = "https://github.com/vllm-project/vllm/commit/9705fba7b727a3b9c275b012258608531e2223d1.patch"; | ||
| hash = "sha256-DxRGLiwkegMlMjqFmFc0igpaVv06/Y2WjL+ISoIOET4="; | ||
| }) | ||
| # patch above is previous commit needed to apply patch below | ||
| # oneDNN / CPU fix from https://github.com/vllm-project/vllm/pull/26401 | ||
| (fetchpatch { | ||
| url = "https://github.com/vllm-project/vllm/commit/d7be1f2a480bdc62a6a1ec0126a401e3d42985fe.patch"; | ||
| hash = "sha256-Zi1k5wiOPjsbWHFKpcLq9Ns43wIP37Mbvesi5K80zaQ="; | ||
| }) | ||
| ]; | ||
|
|
||
| postPatch = '' | ||
| # Remove vendored pynvml entirely | ||
| rm vllm/third_party/pynvml.py | ||
| substituteInPlace tests/utils.py \ | ||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more.
[daniel@laptop:~/Source/vllm]$ git switch --detach v0.11.2
HEAD is now at 275de3417 [BugFix] Fix false assertion with spec-decode=[2,4,..] and TP>2 (#29036)
[daniel@laptop:~/Source/vllm]$ grep -R vllm.third_party.pynvml --exclude-dir=.git
tests/utils.py: from vllm.third_party.pynvml import (
vllm/utils/import_utils.py: import vllm.third_party.pynvml as pynvml |
||
| --replace-fail "from vllm.third_party.pynvml import" "from pynvml import" | ||
| substituteInPlace vllm/utils/__init__.py \ | ||
| --replace-fail "import vllm.third_party.pynvml" "import pynvml" | ||
| --replace-fail \ | ||
| "from vllm.third_party.pynvml import" \ | ||
| "from pynvml import" | ||
| substituteInPlace vllm/utils/import_utils.py \ | ||
| --replace-fail \ | ||
| "import vllm.third_party.pynvml as pynvml" \ | ||
| "import pynvml" | ||
|
|
||
| # pythonRelaxDeps does not cover build-system | ||
| substituteInPlace pyproject.toml \ | ||
| --replace-fail "torch ==" "torch >=" \ | ||
| --replace-fail "setuptools>=77.0.3,<80.0.0" "setuptools" | ||
| --replace-fail "setuptools>=77.0.3,<81.0.0" "setuptools" | ||
|
|
||
| # Ignore the python version check because it hard-codes minor versions and | ||
| # lags behind `ray`'s python interpreter support | ||
|
|
@@ -393,6 +401,7 @@ buildPythonPackage rec { | |
|
|
||
| dependencies = [ | ||
| aioprometheus | ||
| anthropic | ||
| blake3 | ||
| cachetools | ||
| cbor2 | ||
|
|
@@ -424,6 +433,7 @@ buildPythonPackage rec { | |
| partial-json-parser | ||
| compressed-tensors | ||
| mistral-common | ||
| model-hosting-container-standards | ||
| torch | ||
| torchaudio | ||
| torchvision | ||
|
|
@@ -460,6 +470,7 @@ buildPythonPackage rec { | |
| (lib.cmakeFeature "FETCHCONTENT_SOURCE_DIR_CUTLASS" "${lib.getDev cutlass}") | ||
| (lib.cmakeFeature "FLASH_MLA_SRC_DIR" "${lib.getDev flashmla}") | ||
| (lib.cmakeFeature "VLLM_FLASH_ATTN_SRC_DIR" "${lib.getDev vllm-flash-attn'}") | ||
| (lib.cmakeFeature "QUTLASS_SRC_DIR" "${lib.getDev qutlass}") | ||
| (lib.cmakeFeature "TORCH_CUDA_ARCH_LIST" "${gpuTargetString}") | ||
| (lib.cmakeFeature "CUTLASS_NVCC_ARCHS_ENABLED" "${cudaPackages.flags.cmakeCudaArchitecturesString}") | ||
| (lib.cmakeFeature "CUDA_TOOLKIT_ROOT_DIR" "${symlinkJoin { | ||
|
|
||
Oops, something went wrong.
Add this suggestion to a batch that can be applied as a single commit.
This suggestion is invalid because no changes were made to the code.
Suggestions cannot be applied while the pull request is closed.
Suggestions cannot be applied while viewing a subset of changes.
Only one suggestion per line can be applied in a batch.
Add this suggestion to a batch that can be applied as a single commit.
Applying suggestions on deleted lines is not supported.
You must change the existing code in this line in order to create a valid suggestion.
Outdated suggestions cannot be applied.
This suggestion has been applied or marked resolved.
Suggestions cannot be applied from pending reviews.
Suggestions cannot be applied on multi-line comments.
Suggestions cannot be applied while the pull request is queued to merge.
Suggestion cannot be applied right now. Please check back later.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
I thought this needed more ceremony as per https://github.com/daniel-fahey/nixpkgs/blob/4d45e9d901b15422d43c7b1181e5a1ac7e1e0904/pkgs/development/python-modules/vllm/default.nix#L149-L174, but if not, it would benefit from adding
`# grep for GIT_TAG in the following file` above `# https://github.com/vllm-project/vllm/blob/v${version}/cmake/external_projects/qutlass.cmake` for future maintainers.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
I thought so too, but it doesn't seem to need any additional dependencies, so I didn't wrap it in `stdenv.mkDerivation`.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
I added the comment.