Removed temporary patch for NVFP4 quants support as it's been merged into main

2025-11-25 12:48:58 -08:00
parent a93bd56389
commit a96a3a2dac
1 changed files with 2 additions and 2 deletions
--- a/4
+++ b/4
@@ -75,8 +75,8 @@ RUN python3 use_existing_torch.py && \
    sed -i "/flashinfer/d" requirements/cuda.txt && \
    pip install -r requirements/build.txt
-# TEMPORARY - apply NVFP4 patch
+# TEMPORARY - apply NVFP4 patch - MERGED ON 11/25/2025 - TODO: test and remove from Dockerfile
-RUN curl -L https://patch-diff.githubusercontent.com/raw/vllm-project/vllm/pull/29242.diff | git apply
+# RUN curl -L https://patch-diff.githubusercontent.com/raw/vllm-project/vllm/pull/29242.diff | git apply
 # Final Build
 # Uses --no-build-isolation to respect the pre-installed Torch/FlashInfer