Skip to content

Commit d464193

Browse files
authored
enable vLLM upload with CUDA 12.8 build (#465)
1 parent 2559be6 commit d464193

File tree

2 files changed

+43
-44
lines changed

2 files changed

+43
-44
lines changed

.github/packaging/vllm_reqs.txt

Lines changed: 35 additions & 36 deletions
Original file line numberDiff line numberDiff line change
@@ -7,20 +7,20 @@
77
# See the file .github/workflows/gpu_test.yaml for an E2E forge installation using this approach.
88
# TODO: this should be done way less hackily
99
aiohappyeyeballs==2.6.1
10-
aiohttp==3.13.0
10+
aiohttp==3.13.1
1111
aiosignal==1.4.0
1212
annotated-types==0.7.0
1313
anyio==4.11.0
1414
astor==0.8.1
1515
async-timeout==5.0.1
1616
attrs==25.4.0
17-
blake3==1.0.7
18-
cachetools==6.2.0
17+
blake3==1.0.8
18+
cachetools==6.2.1
1919
cbor2==5.7.0
2020
certifi==2025.10.5
2121
cffi==2.0.0
22-
charset-normalizer==3.4.3
23-
click==8.3.0
22+
charset-normalizer==3.4.4
23+
click==8.2.1
2424
cloudpickle==3.1.1
2525
cmake==4.1.0
2626
compressed-tensors==0.10.2
@@ -33,7 +33,7 @@ dnspython==2.8.0
3333
einops==0.8.1
3434
email-validator==2.3.0
3535
exceptiongroup==1.3.0
36-
fastapi==0.118.3
36+
fastapi==0.119.0
3737
fastapi-cli==0.0.13
3838
fastapi-cloud-cli==0.3.1
3939
fastrlock==0.8.3
@@ -47,81 +47,80 @@ httpcore==1.0.9
4747
httptools==0.7.1
4848
httpx==0.28.1
4949
huggingface-hub==0.35.3
50-
idna==3.10
50+
idna==3.11
5151
interegular==0.3.3
5252
Jinja2==3.1.6
53-
jiter==0.11.0
53+
jiter==0.11.1
5454
jsonschema==4.25.1
5555
jsonschema-specifications==2025.9.1
5656
lark==1.2.2
5757
llguidance==0.7.30
5858
llvmlite==0.44.0
5959
lm-format-enforcer==0.10.12
6060
markdown-it-py==4.0.0
61-
MarkupSafe==3.0.2
61+
MarkupSafe==2.1.5
6262
mdurl==0.1.2
6363
mistral_common==1.8.5
6464
mpmath==1.3.0
6565
msgpack==1.1.2
6666
msgspec==0.19.0
6767
multidict==6.7.0
68-
networkx==3.4.2
68+
networkx==3.3
6969
ninja==1.13.0
7070
numba==0.61.2
7171
numpy==2.2.6
72-
nvidia-cublas-cu12==12.9.1.4
73-
nvidia-cuda-cupti-cu12==12.9.79
74-
nvidia-cuda-nvrtc-cu12==12.9.86
75-
nvidia-cuda-runtime-cu12==12.9.79
72+
nvidia-cublas-cu12==12.8.4.1
73+
nvidia-cuda-cupti-cu12==12.8.90
74+
nvidia-cuda-nvrtc-cu12==12.8.93
75+
nvidia-cuda-runtime-cu12==12.8.90
7676
nvidia-cudnn-cu12==9.10.2.21
77-
nvidia-cufft-cu12==11.4.1.4
78-
nvidia-cufile-cu12==1.14.1.1
79-
nvidia-curand-cu12==10.3.10.19
80-
nvidia-cusolver-cu12==11.7.5.82
81-
nvidia-cusparse-cu12==12.5.10.65
77+
nvidia-cufft-cu12==11.3.3.83
78+
nvidia-cufile-cu12==1.13.1.3
79+
nvidia-curand-cu12==10.3.9.90
80+
nvidia-cusolver-cu12==11.7.3.90
81+
nvidia-cusparse-cu12==12.5.8.93
8282
nvidia-cusparselt-cu12==0.7.1
8383
nvidia-nccl-cu12==2.27.5
84-
nvidia-nvjitlink-cu12==12.9.86
84+
nvidia-nvjitlink-cu12==12.8.93
8585
nvidia-nvshmem-cu12==3.3.20
86-
nvidia-nvtx-cu12==12.9.79
86+
nvidia-nvtx-cu12==12.8.90
8787
openai==1.90.0
8888
opencv-python-headless==4.12.0.88
8989
outlines_core==0.2.10
9090
packaging==25.0
9191
partial-json-parser==0.2.1.1.post6
92-
pillow==11.3.0
92+
pillow==12.0.0
9393
prometheus-fastapi-instrumentator==7.1.0
9494
prometheus_client==0.23.1
9595
propcache==0.4.1
96-
protobuf==6.32.1
96+
protobuf==6.33.0
9797
psutil==7.1.0
9898
py-cpuinfo==9.0.0
9999
pybase64==1.4.2
100100
pycountry==24.6.1
101101
pycparser==2.23
102-
pydantic==2.12.0
102+
pydantic==2.12.3
103103
pydantic-extra-types==2.10.6
104-
pydantic_core==2.41.1
104+
pydantic_core==2.41.4
105105
Pygments==2.19.2
106106
python-dotenv==1.1.1
107107
python-json-logger==4.0.0
108108
python-multipart==0.0.20
109-
pytorch-triton==3.4.0+gitf7888497
110109
PyYAML==6.0.3
111110
pyzmq==27.1.0
112-
ray==2.49.2
113-
referencing==0.36.2
111+
ray==2.50.0
112+
referencing==0.37.0
114113
regex==2025.9.18
115114
requests==2.32.5
116115
rich==14.2.0
117116
rich-toolkit==0.15.1
118-
rignore==0.7.0
117+
rignore==0.7.1
119118
rpds-py==0.27.1
120119
safetensors==0.6.2
121120
scipy==1.15.3
122121
sentencepiece==0.2.1
123-
sentry-sdk==2.41.0
124-
setuptools-scm==9.2.0
122+
sentry-sdk==2.42.0
123+
setuptools-scm==9.2.1
125124
shellingham==1.5.4
126125
sniffio==1.3.1
127126
soundfile==0.13.1
@@ -131,17 +130,17 @@ sympy==1.14.0
131130
tiktoken==0.12.0
132131
tokenizers==0.22.1
133132
tomli==2.3.0
134-
torch==2.9.0.dev20250905+cu129
133+
torch==2.9.0+cu128
135134
tqdm==4.67.1
136-
transformers==4.57.0
137-
triton==3.4.0
135+
transformers==4.57.1
136+
triton==3.5.0
138137
typer==0.19.2
139138
typing-inspection==0.4.2
140139
typing_extensions==4.15.0
141140
urllib3==2.5.0
142141
uvicorn==0.37.0
143-
uvloop==0.21.0
144-
watchfiles==1.1.0
142+
uvloop==0.22.1
143+
watchfiles==1.1.1
145144
websockets==15.0.1
146145
xgrammar==0.1.21
147146
yarl==1.22.0

.github/workflows/build_vllm.yaml

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -12,15 +12,15 @@ permissions:
1212

1313
jobs:
1414
build:
15-
name: forge-cu129-nightly
16-
uses: pytorch/test-infra/.github/workflows/build_wheels_linux.yml@main
15+
name: forge-cu128-nightly
16+
uses: pytorch/test-infra/.github/workflows/build_wheels_linux.yml@vllm-push
1717
strategy:
1818
fail-fast: false
1919
with:
2020
repository: meta-pytorch/forge
2121
ref: ""
2222
test-infra-repository: pytorch/test-infra
23-
test-infra-ref: main
23+
test-infra-ref: vllm-push
2424
run-smoke-test: false
2525
wheel-nightly-policy: gha_workflow_preview_build_wheels
2626
wheel-upload-path: whl/preview/forge/
@@ -31,13 +31,13 @@ jobs:
3131
{
3232
"python_version": "3.10",
3333
"gpu_arch_type": "cpu",
34-
"gpu_arch_version": "12.9",
35-
"desired_cuda": "cu129",
36-
"container_image": "pytorch/manylinux2_28-builder:cuda12.9",
34+
"gpu_arch_version": "12.8",
35+
"desired_cuda": "cu128",
36+
"container_image": "pytorch/manylinux2_28-builder:cuda12.8",
3737
"package_type": "manywheel",
38-
"build_name": "manywheel-py3_10-cuda12_9",
38+
"build_name": "manywheel-py3_10-cuda12_8",
3939
"validation_runner": "linux.12xlarge.memory",
40-
"installation": "pip3 install --pre torch torchvision torchaudio --index-url https://download.pytorch.org/whl/nightly/cu129",
40+
"installation": "pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu128",
4141
"channel": "nightly",
4242
"upload_to_base_bucket": "no",
4343
"stable_version": "2.8.0",

0 commit comments

Comments
 (0)