Dockerfile.wheels: install the flashinfer helper packages without --pre

Removes the --pre flag from the three `uv pip install` commands for
flashinfer-python, flashinfer-cubin and flashinfer-jit-cache. Every other
argument, including the index URLs, is left unchanged.

NOTE(review): the line breaks of this patch were restored from a copy that
had been flattened onto a single line. The two blank context lines and the
single-space indentation of the continuation lines are reconstructed (they
are consistent with the 9-line hunk counts). Confirm against
Dockerfile.wheels, or apply with `git apply --ignore-whitespace`.

diff --git a/Dockerfile.wheels b/Dockerfile.wheels
index 4c6e964..da6ed1f 100644
--- a/Dockerfile.wheels
+++ b/Dockerfile.wheels
@@ -63,9 +63,9 @@ RUN patch -p1 -d /usr/local/lib/python3.12/dist-packages < ${VLLM_BASE_DIR}/fast
 
 # Install flashinfer helper packages
 RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
- uv pip install --system --break-system-packages flashinfer-python -U --no-deps --pre --index-url https://flashinfer.ai/whl && \
- uv pip install --system --break-system-packages flashinfer-cubin --pre --index-url https://flashinfer.ai/whl && \
- uv pip install --system --break-system-packages flashinfer-jit-cache --pre --index-url https://flashinfer.ai/whl/cu130
+ uv pip install --system --break-system-packages flashinfer-python -U --no-deps --index-url https://flashinfer.ai/whl && \
+ uv pip install --system --break-system-packages flashinfer-cubin --index-url https://flashinfer.ai/whl && \
+ uv pip install --system --break-system-packages flashinfer-jit-cache --index-url https://flashinfer.ai/whl/cu130
 
 # Setup Env for Runtime
 ENV TORCH_CUDA_ARCH_LIST=12.1a