Bumped base image version; reverted Triton to 3.5.1

This commit is contained in:
Eugene Rakhmatulin
2026-01-29 23:14:43 -08:00
parent ace61c2d55
commit ef0f996df6
4 changed files with 7 additions and 6 deletions

View File

@@ -6,7 +6,7 @@ ARG BUILD_JOBS=16
# ========================================================= # =========================================================
# STAGE 1: Base Image (Installs Dependencies) # STAGE 1: Base Image (Installs Dependencies)
# ========================================================= # =========================================================
FROM nvidia/cuda:13.1.0-devel-ubuntu24.04 AS base FROM nvidia/cuda:13.1.1-devel-ubuntu24.04 AS base
# Build parallelism # Build parallelism
ARG BUILD_JOBS ARG BUILD_JOBS
@@ -102,7 +102,7 @@ RUN git clone https://github.com/triton-lang/triton.git
# We expect TRITON_REF to be passed from the command line to break the cache # We expect TRITON_REF to be passed from the command line to break the cache
# Set to v3.5.1 tag by default # Set to v3.5.1 tag by default
ARG TRITON_REF=v3.6.0 ARG TRITON_REF=v3.5.1
WORKDIR $VLLM_BASE_DIR/triton WORKDIR $VLLM_BASE_DIR/triton
@@ -193,7 +193,7 @@ RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
# ========================================================= # =========================================================
# STAGE 4: Runner (Transfers only necessary artifacts) # STAGE 4: Runner (Transfers only necessary artifacts)
# ========================================================= # =========================================================
FROM nvidia/cuda:13.1.0-devel-ubuntu24.04 AS runner FROM nvidia/cuda:13.1.1-devel-ubuntu24.04 AS runner
ENV DEBIAN_FRONTEND=noninteractive ENV DEBIAN_FRONTEND=noninteractive
ENV PIP_BREAK_SYSTEM_PACKAGES=1 ENV PIP_BREAK_SYSTEM_PACKAGES=1

View File

@@ -258,7 +258,8 @@ RUN mkdir -p tiktoken_encodings && \
# No need to copy source code, as it's already in the site-packages # No need to copy source code, as it's already in the site-packages
COPY --from=builder /workspace/wheels /workspace/wheels COPY --from=builder /workspace/wheels /workspace/wheels
RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \ RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
uv pip install /workspace/wheels/*.whl uv pip install /workspace/wheels/*.whl && \
rm -rf /workspace/wheels
# Setup Env for Runtime # Setup Env for Runtime
ENV TORCH_CUDA_ARCH_LIST="12.0;12.1" ENV TORCH_CUDA_ARCH_LIST="12.0;12.1"

View File

@@ -1,6 +1,6 @@
# syntax=docker/dockerfile:1.6 # syntax=docker/dockerfile:1.6
FROM nvidia/cuda:13.1.0-devel-ubuntu24.04 FROM nvidia/cuda:13.1.1-devel-ubuntu24.04
ENV DEBIAN_FRONTEND=noninteractive ENV DEBIAN_FRONTEND=noninteractive
ENV PIP_BREAK_SYSTEM_PACKAGES=1 ENV PIP_BREAK_SYSTEM_PACKAGES=1

View File

@@ -11,7 +11,7 @@ REBUILD_VLLM=false
COPY_HOSTS=() COPY_HOSTS=()
SSH_USER="$USER" SSH_USER="$USER"
NO_BUILD=false NO_BUILD=false
TRITON_REF="v3.6.0" TRITON_REF="v3.5.1"
VLLM_REF="main" VLLM_REF="main"
TMP_IMAGE="" TMP_IMAGE=""
PARALLEL_COPY=false PARALLEL_COPY=false