From 37953478f0dd85049e8f0fe6d617452e8c7f5386 Mon Sep 17 00:00:00 2001 From: Eugene Rakhmatulin Date: Mon, 2 Feb 2026 09:21:48 -0800 Subject: [PATCH] changed arch codes again to be in line with upcoming PR --- Dockerfile | 8 ++++---- Dockerfile.mxfp4 | 8 ++++---- 2 files changed, 8 insertions(+), 8 deletions(-) diff --git a/Dockerfile b/Dockerfile index 12c3fd4..2980c2b 100644 --- a/Dockerfile +++ b/Dockerfile @@ -55,7 +55,7 @@ ENV CMAKE_CUDA_COMPILER_LAUNCHER=ccache WORKDIR $VLLM_BASE_DIR # 2. Set Environment Variables -ENV TORCH_CUDA_ARCH_LIST=12.1a +ENV TORCH_CUDA_ARCH_LIST=12.1f ENV TRITON_PTXAS_PATH=/usr/local/cuda/bin/ptxas # ========================================================= @@ -90,7 +90,7 @@ FROM base AS builder # ======= FlashInfer Build ========== -ENV FLASHINFER_CUDA_ARCH_LIST="12.1a" +ENV FLASHINFER_CUDA_ARCH_LIST="12.1f" WORKDIR $VLLM_BASE_DIR ARG FLASHINFER_REF=main @@ -265,8 +265,8 @@ RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \ fi # Setup Env for Runtime -ENV TORCH_CUDA_ARCH_LIST=12.1a -ENV FLASHINFER_CUDA_ARCH_LIST="12.1a" +ENV TORCH_CUDA_ARCH_LIST=12.1f +ENV FLASHINFER_CUDA_ARCH_LIST="12.1f" ENV TRITON_PTXAS_PATH=/usr/local/cuda/bin/ptxas ENV TIKTOKEN_ENCODINGS_BASE=$VLLM_BASE_DIR/tiktoken_encodings ENV PATH=$VLLM_BASE_DIR:$PATH diff --git a/Dockerfile.mxfp4 b/Dockerfile.mxfp4 index 6863a98..2a27f7b 100644 --- a/Dockerfile.mxfp4 +++ b/Dockerfile.mxfp4 @@ -67,7 +67,7 @@ ENV CMAKE_CUDA_COMPILER_LAUNCHER=ccache WORKDIR $VLLM_BASE_DIR # 2. Set Environment Variables -ENV TORCH_CUDA_ARCH_LIST="12.1a" +ENV TORCH_CUDA_ARCH_LIST="12.1f" ENV TRITON_PTXAS_PATH=/usr/local/cuda/bin/ptxas # --- CACHE BUSTER --- @@ -88,7 +88,7 @@ RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \ # ========================================================= FROM base AS builder -ENV FLASHINFER_CUDA_ARCH_LIST="12.1a" +ENV FLASHINFER_CUDA_ARCH_LIST="12.1f" WORKDIR $VLLM_BASE_DIR @@ -261,8 +261,8 @@ RUN --mount=type=bind,from=builder,source=/workspace/wheels,target=/mount/wheels uv pip install /mount/wheels/*.whl # Setup Env for Runtime -ENV TORCH_CUDA_ARCH_LIST="12.1a" -ENV FLASHINFER_CUDA_ARCH_LIST="12.1a" +ENV TORCH_CUDA_ARCH_LIST="12.1f" +ENV FLASHINFER_CUDA_ARCH_LIST="12.1f" ENV TRITON_PTXAS_PATH=/usr/local/cuda/bin/ptxas ENV TIKTOKEN_ENCODINGS_BASE=$VLLM_BASE_DIR/tiktoken_encodings ENV PATH=$VLLM_BASE_DIR:$PATH