Skip to content

Commit 2ad555c

Browse files
committed
chore: Use exact commit hash for Triton from vLLM PR
1 parent 9c74a08 commit 2ad555c

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

vllm-tensorizer/Dockerfile

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -71,7 +71,7 @@ RUN git clone --filter=tree:0 --no-single-branch --no-checkout \
71 71

72 72
FROM alpine/git:2.36.3 AS triton-downloader
73 73
WORKDIR /git
74-
ARG TRITON_COMMIT='v3.4.0'
74+
ARG TRITON_COMMIT='663e04e8e3ebed7ee3230a1a7320142689795106'
75 75
RUN git clone --filter=tree:0 --no-single-branch --no-checkout \
76 76
https://github.com/openai/triton.git && \
77 77
cd triton && \
@@ -124,6 +124,7 @@ RUN --mount=type=bind,from=flashinfer-downloader,source=/git/flashinfer,target=/
124 124
export TORCH_CUDA_ARCH_LIST="$(echo "${TORCH_CUDA_ARCH_LIST}" | sed 's@[67]\.0 \+@@g')" && \
125 125
sed -i 's@torch\.cuda\.get_device_capability()@(12, 0)@' flashinfer/comm/trtllm_ar.py && \
126 126
python3 -m flashinfer.aot && \
127+
python3 -m flashinfer.aot && \
127 128
python3 -m pip wheel -w /wheels \
128 129
-v --no-cache-dir --no-build-isolation --no-deps \
129 130
-c /opt/constraints.txt \

0 commit comments

Comments (0)