diff --git a/Dockerfile b/Dockerfile index 93492c2..12d850e 100644 --- a/Dockerfile +++ b/Dockerfile @@ -316,7 +316,7 @@ ARG PRE_TRANSFORMERS=0 # Install deps RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \ uv pip install torch==2.11.0 torchvision torchaudio triton --index-url https://download.pytorch.org/whl/cu130 && \ - uv pip install nvidia-nvshmem-cu13 "apache-tvm-ffi<0.2" nvidia-cutlass-dsl-libs-cu13 + uv pip install nvidia-nvshmem-cu13 "apache-tvm-ffi<0.2" # Install wheels from host ./wheels/ (bind-mounted from build context — no layer bloat) # With --tf5: override vLLM's transformers<5 constraint to get transformers>=5