File tree Expand file tree Collapse file tree 1 file changed +6
-2
lines changed Expand file tree Collapse file tree 1 file changed +6
-2
lines changed Original file line number Diff line number Diff line change @@ -501,8 +501,12 @@ COPY --from=dev /workspace/target/release/metrics /usr/local/bin/metrics
501
501
# NOTE: If a package (tensorrt_llm) exists on both --index-url and --extra-index-url,
502
502
# uv will prioritize the --extra-index-url, unless --index-strategy unsafe-best-match
503
503
# is also specified. So set the configurable index as a --extra-index-url for prioritization.
504
- # locking triton version to 3.3.1 as 3.4.0 breaks tensorrt-llm 1.0.0rc4
505
- RUN uv pip install --extra-index-url "${TENSORRTLLM_INDEX_URL}" "${TENSORRTLLM_PIP_WHEEL}" && \
504
+ # NOTE: locking triton version to 3.3.1 as 3.4.0 breaks tensorrt-llm 1.0.0rc4
505
+ # NOTE: locking cuda-python version to <13 to avoid breakage with tensorrt-llm 1.0.0rc4. This
506
+ # can be removed after https://github.com/NVIDIA/TensorRT-LLM/pull/6703 is merged
507
+ # and we upgrade to a published pip wheel containing this change.
508
+ RUN uv pip install "cuda-python>=12,<13" && \
509
+ uv pip install --extra-index-url "${TENSORRTLLM_INDEX_URL}" "${TENSORRTLLM_PIP_WHEEL}" && \
506
510
if [ "$ARCH" = "amd64" ]; then \
507
511
pip install "triton==3.3.1"; \
508
512
fi; \
You can’t perform that action at this time.
0 commit comments