diff --git a/Dockerfile b/Dockerfile index 3f4ace6..eda1ce8 100644 --- a/Dockerfile +++ b/Dockerfile @@ -122,25 +122,15 @@ RUN if [ -n "$FLASHINFER_PRS" ]; then \ done; \ fi -# TEMPORARY patch for NVFP4 crash (PR 2913) -RUN curl -fsL https://github.com/flashinfer-ai/flashinfer/pull/2913.diff -o pr2913.diff \ - && if git apply --reverse --check pr2913.diff 2>/dev/null; then \ - echo "PR #2913 already applied, skipping."; \ +# TEMPORARY patch for flashinfer autotune and other improvements (PR 2927) +RUN curl -fsL https://github.com/flashinfer-ai/flashinfer/pull/2927.diff -o pr2927.diff \ + && if git apply --reverse --check pr2927.diff 2>/dev/null; then \ + echo "PR #2927 already applied, skipping."; \ else \ - echo "Applying FI PR #2913..."; \ - git apply -v pr2913.diff; \ + echo "Applying FI PR #2927..."; \ + git apply -v pr2927.diff; \ fi \ - && rm pr2913.diff - -# TEMPORARY patch for flashinfer autotune and other improvements (PR 2897) -RUN curl -fsL https://github.com/flashinfer-ai/flashinfer/pull/2897.diff -o pr2897.diff \ - && if git apply --reverse --check pr2897.diff 2>/dev/null; then \ - echo "PR #2897 already applied, skipping."; \ - else \ - echo "Applying FI PR #2897..."; \ - git apply -v pr2897.diff; \ - fi \ - && rm pr2897.diff + && rm pr2927.diff # Apply patch to avoid re-downloading existing cubins COPY flashinfer_cache.patch .