Implemented a temporary patch for recently broken MiniMax-M2 (in builds after 12/10) for some quants.

2025-12-11 11:13:05 -08:00
parent 9d351cd6d5
commit 5fba205db4
2 changed files with 8 additions and 0 deletions
--- a/3
+++ b/3
@@ -80,6 +80,9 @@ RUN python3 use_existing_torch.py && \
 COPY fastsafetensors.patch .
 RUN patch -p1 < fastsafetensors.patch

+# TEMPORARY PATCH for broken MiniMax M2 - tracking https://github.com/vllm-project/vllm/issues/30445 and https://github.com/vllm-project/vllm/pull/30389 (fetched with -f into a file, not piped, so a failed download fails the build)
+RUN curl -fsSL https://patch-diff.githubusercontent.com/raw/vllm-project/vllm/pull/30389.diff -o /tmp/vllm-pr-30389.diff && git apply /tmp/vllm-pr-30389.diff && rm -f /tmp/vllm-pr-30389.diff
+
 # Final Build
 # Uses --no-build-isolation to respect the pre-installed Torch/FlashInfer
 RUN pip install --no-build-isolation . -v