Skip to content

Commit 73bcc3b

Browse files
authored
fix(build): Pin cuda-python>=12,<13 to avoid trtllm breakage (#2379)
1 parent bd8e368 commit 73bcc3b

File tree

1 file changed

+6
-2
lines changed

1 file changed

+6
-2
lines changed

container/Dockerfile.tensorrt_llm

Lines changed: 6 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -501,8 +501,12 @@ COPY --from=dev /workspace/target/release/metrics /usr/local/bin/metrics
501501
# NOTE: If a package (tensorrt_llm) exists on both --index-url and --extra-index-url,
502502
# uv will prioritize the --extra-index-url, unless --index-strategy unsafe-best-match
503503
# is also specified. So set the configurable index as a --extra-index-url for prioritization.
504-
# locking triton version to 3.3.1 as 3.4.0 breaks tensorrt-llm 1.0.0rc4
505-
RUN uv pip install --extra-index-url "${TENSORRTLLM_INDEX_URL}" "${TENSORRTLLM_PIP_WHEEL}" && \
504+
# NOTE: locking triton version to 3.3.1 as 3.4.0 breaks tensorrt-llm 1.0.0rc4
505+
# NOTE: locking cuda-python version to <13 to avoid breaking tensorrt-llm 1.0.0rc4. This
506+
# can be removed after https://github.com/NVIDIA/TensorRT-LLM/pull/6703 is merged
507+
# and we upgrade to a published pip wheel containing this change.
508+
RUN uv pip install "cuda-python>=12,<13" && \
509+
uv pip install --extra-index-url "${TENSORRTLLM_INDEX_URL}" "${TENSORRTLLM_PIP_WHEEL}" && \
506510
if [ "$ARCH" = "amd64" ]; then \
507511
pip install "triton==3.3.1"; \
508512
fi; \

0 commit comments

Comments
 (0)