2 files changed: +29 -28 lines changed
Original file line number | Diff line number | Diff line change
9
9
IMAGE : zappi/vllm-openai
10
10
11
11
jobs :
12
+ build-triton-wheel-arm64 :
13
+ runs-on : ubuntu-24.04-arm
14
+ concurrency : arm64
15
+ steps :
16
+ - name : Build wheels
17
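+ uses : pypa/cibuildwheel@v3.1.4 # NOTE(review): action reference was stripped during extraction; exact version tag is an assumption, confirm against the commit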
18
+ env :
19
+ CIBW_BEFORE_ALL : " dnf install clang lld -y"
20
+ CIBW_BUILD : " cp312-manylinux_aarch64"
21
+ CIBW_ENVIRONMENT : " MAX_JOBS=4 TRITON_BUILD_WITH_CLANG_LLD=1"
22
+ with :
23
+ package-dir : python
24
+ output-dir : wheelhouse
25
+ - name : Upload wheels
26
+ uses : actions/upload-artifact@v4
27
+ with :
28
+ name : triton-wheels-linux-arm64
29
+ path : ./wheelhouse/*.whl
30
+
12
31
build-amd64 :
13
32
runs-on : ubuntu-latest
14
33
concurrency : amd64
49
68
50
69
build-arm64 :
51
70
runs-on : ubuntu-latest
71
+ needs : build-triton-wheel-arm64
52
72
concurrency : arm64
53
73
steps :
54
74
- name : Free additional disk space
66
86
df -h
67
87
- name : Checkout
68
88
uses : actions/checkout@v4
89
+ - name : Download a single artifact
90
+ uses : actions/download-artifact@v5
91
+ with :
92
+ name : triton-wheels-linux-arm64
93
+ path : ./wheelhouse/
69
94
- name : Prepare image metadata
70
95
id : metadata
71
96
uses : docker/metadata-action@v5
Original file line number Diff line number Diff line change 1
- FROM python:3.12-slim AS triton-builder
1
+ FROM vllm/vllm-openai:v0.10.2
2
2
3
- RUN apt-get update -qq && \
4
- apt-get install -qq -y \
5
- build-essential \
6
- clang \
7
- cmake \
8
- git \
9
- lld \
10
- llvm && \
11
- rm -rf /var/lib/apt/lists/*
12
-
13
- RUN git clone https://github.com/triton-lang/triton.git /tmp/triton \
14
- --depth 1 \
15
- --branch v3.2.0
16
-
17
- ARG TRITON_BUILD_WITH_CLANG_LLD=true
18
- RUN --mount=type=cache,target=/root/.cache/pip \
19
- cd /tmp/triton && \
20
- pip install ninja cmake wheel pybind11 && \
21
- pip wheel ./python --wheel-dir /tmp/wheels
22
-
23
- FROM vllm/vllm-openai:v0.10.2 AS final
24
-
25
- COPY --from=triton-builder /tmp/wheels/*.whl /tmp/wheels/
26
-
27
- RUN --mount=type=cache,target=/root/.cache/uv \
28
- uv pip install --system /tmp/wheels/*.whl && \
29
- rm -rf /tmp/wheels
3
+ RUN --mount=type=bind,source=./wheelhouse,target=/wheelhouse \
4
+ --mount=type=cache,target=/root/.cache/uv \
5
+ uv pip install --system /wheelhouse/*.whl
You can’t perform that action at this time.
0 commit comments