Skip to content

Commit b8e0b2a

Browse files
committed
chore: Attempt initial build
1 parent 8552fbc commit b8e0b2a

File tree

2 files changed

+30
-1
lines changed

2 files changed

+30
-1
lines changed

.github/configurations/vllm-tensorizer.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
vllm-commit:
2-
- 'v0.10.0'
2+
- '8260948cdc379d13bf4b80d3172a03d21a983e05'
33
flashinfer-commit:
44
- 'v0.2.8'
55
builder-base-image:

vllm-tensorizer/Dockerfile

Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -69,6 +69,15 @@ RUN git clone --filter=tree:0 --no-single-branch --no-checkout \
6969
git submodule update --init --recursive --jobs 8 \
7070
--depth 1 --filter=tree:0
7171

72+
# Fetch the Triton sources (and their submodules) at the ref named by
# TRITON_COMMIT. The result is left in /git/triton for later stages to mount.
FROM alpine/git:2.36.3 AS triton-downloader
WORKDIR /git
# Tag, branch, or commit SHA of Triton to check out.
ARG TRITON_COMMIT='v3.4.0'
# Clone from the repository's current home (triton-lang/triton) rather than
# depending on GitHub's redirect from the former openai/triton location.
# --no-checkout defers populating the work tree until the requested ref is
# selected; --no-single-branch fetches all branches so any ref can be
# checked out.
RUN git clone --filter=tree:0 --no-single-branch --no-checkout \
      https://github.com/triton-lang/triton.git && \
    cd triton && \
    git checkout "${TRITON_COMMIT}" && \
    git submodule update --init --recursive --jobs 8 \
      --depth 1 --filter=tree:0
7281

7382
FROM alpine/git:2.36.3 AS lmcache-downloader
7483
WORKDIR /git
@@ -122,6 +131,21 @@ RUN --mount=type=bind,from=flashinfer-downloader,source=/git/flashinfer,target=/
122131

123132
WORKDIR /wheels
124133

134+
# Build wheels for Triton and for the triton_kernels package that lives under
# python/triton_kernels, using the sources from the triton-downloader stage.
# Both wheels are written to /wheels.
FROM builder-base AS triton-builder
# The sources are bind-mounted read-write at /workspace. The relative paths
# below (python/requirements.txt, ./, python/triton_kernels) assume that
# builder-base leaves WORKDIR at /workspace -- TODO confirm.
# Every pip call goes through `python3 -m pip`, matching the rest of this
# file, so the build requirements are installed into the same interpreter
# that builds the wheels.
RUN --mount=type=bind,from=triton-downloader,source=/git/triton,target=/workspace,rw \
    . /opt/arch_flags.sh && \
    python3 -m pip install --no-cache-dir -r python/requirements.txt && \
    python3 -m pip wheel -w /wheels \
      -v --no-cache-dir --no-build-isolation --no-deps \
      -c /opt/constraints.txt \
      ./ && \
    python3 -m pip wheel -w /wheels \
      -v --no-cache-dir --no-build-isolation --no-deps \
      -c /opt/constraints.txt \
      python/triton_kernels

WORKDIR /wheels
148+
125149

126150
FROM builder-base AS lmcache-builder
127151
# LMCache must be built from source as it doesn't have pre-built ARM binaries
@@ -170,13 +194,18 @@ RUN --mount=type=bind,from=vllm-builder,source=/wheels,target=/tmp/wheels \
170194
# Install the wheels from the flashinfer-builder stage, resolved against the
# shared constraints file.
RUN --mount=type=bind,from=flashinfer-builder,source=/wheels,target=/tmp/wheels \
    python3 -m pip install --no-cache-dir -c /tmp/constraints.txt /tmp/wheels/*.whl
172196

197+
# Install the wheels from the triton-builder stage, resolved against the
# shared constraints file.
RUN --mount=type=bind,from=triton-builder,source=/wheels,target=/tmp/wheels \
    python3 -m pip install --no-cache-dir -c /tmp/constraints.txt /tmp/wheels/*.whl
199+
173200
# LMCache depends on InfiniStore, so the InfiniStore wheels have to be
# installed before the LMCache ones.
RUN --mount=type=bind,from=infinistore-builder,source=/wheels,target=/tmp/wheels \
    python3 -m pip install --no-cache-dir -c /tmp/constraints.txt /tmp/wheels/*.whl
176203

177204
# Install the wheels from the lmcache-builder stage, resolved against the
# shared constraints file.
RUN --mount=type=bind,from=lmcache-builder,source=/wheels,target=/tmp/wheels \
    python3 -m pip install --no-cache-dir -c /tmp/constraints.txt /tmp/wheels/*.whl
179206

207+
# Pin transformers to 4.54.1, resolved against the shared constraints file.
RUN python3 -m pip install --no-cache-dir -c /tmp/constraints.txt "transformers==4.54.1"
208+
180209
# Copied from vLLM's Dockerfile
181210
ARG TARGETPLATFORM
182211

0 commit comments

Comments
 (0)