Pin nvidia-nvshmem-cu13 to <3.6 in Dockerfile.mxfp4
nvidia-nvshmem-cu13 3.6.5 (released Mar 24) introduced a breaking change: nvshmemi_device_state_d was removed from the NVSHMEM headers, which breaks FlashInfer's AOT compilation of nvshmem_binding.cu.
This commit is contained in:
@@ -101,7 +101,7 @@ ARG FLASHINFER_SHA=f349e52496a72a00d8c4ac02c7a1e38523ff7194
|
|||||||
ARG CUTLASS_SHA=c7516ad20f3d022fdbc93e9468643bf3b577e02c
|
ARG CUTLASS_SHA=c7516ad20f3d022fdbc93e9468643bf3b577e02c
|
||||||
|
|
||||||
RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
|
RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
|
||||||
uv pip install nvidia-nvshmem-cu13 "apache-tvm-ffi<0.2"
|
uv pip install "nvidia-nvshmem-cu13<3.6" "apache-tvm-ffi<0.2"
|
||||||
|
|
||||||
# Clone FlashInfer (cached for faster rebuilds)
|
# Clone FlashInfer (cached for faster rebuilds)
|
||||||
RUN --mount=type=cache,id=git-flashinfer,target=/git-cache/flashinfer \
|
RUN --mount=type=cache,id=git-flashinfer,target=/git-cache/flashinfer \
|
||||||
@@ -272,7 +272,7 @@ ENV PATH=$VLLM_BASE_DIR:$PATH
|
|||||||
|
|
||||||
# Final extra deps
|
# Final extra deps
|
||||||
RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
|
RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
|
||||||
uv pip install ray[default] fastsafetensors nvidia-nvshmem-cu13
|
uv pip install ray[default] fastsafetensors "nvidia-nvshmem-cu13<3.6"
|
||||||
|
|
||||||
# Build metadata (generated by build-and-copy.sh)
|
# Build metadata (generated by build-and-copy.sh)
|
||||||
COPY build-metadata.yaml /workspace/build-metadata.yaml
|
COPY build-metadata.yaml /workspace/build-metadata.yaml
|
||||||
|
|||||||
Reference in New Issue
Block a user