Bumped base image version; reverted Triton to 3.5.1

This commit is contained in:
Eugene Rakhmatulin
2026-01-29 23:14:43 -08:00
parent ace61c2d55
commit ef0f996df6
4 changed files with 7 additions and 6 deletions

View File

@@ -6,7 +6,7 @@ ARG BUILD_JOBS=16
# =========================================================
# STAGE 1: Base Image (Installs Dependencies)
# =========================================================
FROM nvidia/cuda:13.1.0-devel-ubuntu24.04 AS base
FROM nvidia/cuda:13.1.1-devel-ubuntu24.04 AS base
# Build parallelism
ARG BUILD_JOBS
@@ -102,7 +102,7 @@ RUN git clone https://github.com/triton-lang/triton.git
# We expect TRITON_REF to be passed from the command line to break the cache
# Set to v3.5.1 tag by default
ARG TRITON_REF=v3.6.0
ARG TRITON_REF=v3.5.1
WORKDIR $VLLM_BASE_DIR/triton
@@ -193,7 +193,7 @@ RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
# =========================================================
# STAGE 4: Runner (Transfers only necessary artifacts)
# =========================================================
FROM nvidia/cuda:13.1.0-devel-ubuntu24.04 AS runner
FROM nvidia/cuda:13.1.1-devel-ubuntu24.04 AS runner
ENV DEBIAN_FRONTEND=noninteractive
ENV PIP_BREAK_SYSTEM_PACKAGES=1

View File

@@ -258,7 +258,8 @@ RUN mkdir -p tiktoken_encodings && \
# No need to copy source code, as it's already in the site-packages
COPY --from=builder /workspace/wheels /workspace/wheels
RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
uv pip install /workspace/wheels/*.whl
uv pip install /workspace/wheels/*.whl && \
rm -rf /workspace/wheels
# Setup Env for Runtime
ENV TORCH_CUDA_ARCH_LIST="12.0;12.1"

View File

@@ -1,6 +1,6 @@
# syntax=docker/dockerfile:1.6
FROM nvidia/cuda:13.1.0-devel-ubuntu24.04
FROM nvidia/cuda:13.1.1-devel-ubuntu24.04
ENV DEBIAN_FRONTEND=noninteractive
ENV PIP_BREAK_SYSTEM_PACKAGES=1

View File

@@ -11,7 +11,7 @@ REBUILD_VLLM=false
COPY_HOSTS=()
SSH_USER="$USER"
NO_BUILD=false
TRITON_REF="v3.6.0"
TRITON_REF="v3.5.1"
VLLM_REF="main"
TMP_IMAGE=""
PARALLEL_COPY=false