File tree Expand file tree Collapse file tree 1 file changed +6
-2
lines changed Expand file tree Collapse file tree 1 file changed +6
-2
lines changed Original file line number Diff line number Diff line change @@ -501,8 +501,12 @@ COPY --from=dev /workspace/target/release/metrics /usr/local/bin/metrics
501501# NOTE: If a package (tensorrt_llm) exists on both --index-url and --extra-index-url,
502502# uv will prioritize the --extra-index-url, unless --index-strategy unsafe-best-match
503503# is also specified. So set the configurable index as a --extra-index-url for prioritization.
504- # locking triton version to 3.3.1 as 3.4.0 breaks tensorrt-llm 1.0.0rc4
505- RUN uv pip install --extra-index-url "${TENSORRTLLM_INDEX_URL}" "${TENSORRTLLM_PIP_WHEEL}" && \
504+ # NOTE: locking triton version to 3.3.1 as 3.4.0 breaks tensorrt-llm 1.0.0rc4
505+ # NOTE: locking cuda-python version to <13 to avoid breakage with tensorrt-llm 1.0.0rc4. This
506+ # can be removed after https://github.com/NVIDIA/TensorRT-LLM/pull/6703 is merged
507+ # and we upgrade to a published pip wheel containing this change.
508+ RUN uv pip install "cuda-python>=12,<13" && \
509+ uv pip install --extra-index-url "${TENSORRTLLM_INDEX_URL}" "${TENSORRTLLM_PIP_WHEEL}" && \
506510 if [ "$ARCH" = "amd64" ]; then \
507511 pip install "triton==3.3.1"; \
508512 fi; \
You can’t perform that action at this time.
0 commit comments