Bumped base image version; reverted Triton to 3.5.1
This commit is contained in:
@@ -6,7 +6,7 @@ ARG BUILD_JOBS=16
|
|||||||
# =========================================================
|
# =========================================================
|
||||||
# STAGE 1: Base Image (Installs Dependencies)
|
# STAGE 1: Base Image (Installs Dependencies)
|
||||||
# =========================================================
|
# =========================================================
|
||||||
FROM nvidia/cuda:13.1.0-devel-ubuntu24.04 AS base
|
FROM nvidia/cuda:13.1.1-devel-ubuntu24.04 AS base
|
||||||
|
|
||||||
# Build parallelism
|
# Build parallelism
|
||||||
ARG BUILD_JOBS
|
ARG BUILD_JOBS
|
||||||
@@ -102,7 +102,7 @@ RUN git clone https://github.com/triton-lang/triton.git
|
|||||||
|
|
||||||
# We expect TRITON_REF to be passed from the command line to break the cache
|
# We expect TRITON_REF to be passed from the command line to break the cache
|
||||||
# Set to v3.5.1 tag by default
|
# Set to v3.5.1 tag by default
|
||||||
ARG TRITON_REF=v3.6.0
|
ARG TRITON_REF=v3.5.1
|
||||||
|
|
||||||
WORKDIR $VLLM_BASE_DIR/triton
|
WORKDIR $VLLM_BASE_DIR/triton
|
||||||
|
|
||||||
@@ -193,7 +193,7 @@ RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
|
|||||||
# =========================================================
|
# =========================================================
|
||||||
# STAGE 4: Runner (Transfers only necessary artifacts)
|
# STAGE 4: Runner (Transfers only necessary artifacts)
|
||||||
# =========================================================
|
# =========================================================
|
||||||
FROM nvidia/cuda:13.1.0-devel-ubuntu24.04 AS runner
|
FROM nvidia/cuda:13.1.1-devel-ubuntu24.04 AS runner
|
||||||
|
|
||||||
ENV DEBIAN_FRONTEND=noninteractive
|
ENV DEBIAN_FRONTEND=noninteractive
|
||||||
ENV PIP_BREAK_SYSTEM_PACKAGES=1
|
ENV PIP_BREAK_SYSTEM_PACKAGES=1
|
||||||
|
|||||||
@@ -258,7 +258,8 @@ RUN mkdir -p tiktoken_encodings && \
|
|||||||
# No need to copy source code, as it's already in the site-packages
|
# No need to copy source code, as it's already in the site-packages
|
||||||
COPY --from=builder /workspace/wheels /workspace/wheels
|
COPY --from=builder /workspace/wheels /workspace/wheels
|
||||||
RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
|
RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
|
||||||
uv pip install /workspace/wheels/*.whl
|
uv pip install /workspace/wheels/*.whl && \
|
||||||
|
rm -rf /workspace/wheels
|
||||||
|
|
||||||
# Setup Env for Runtime
|
# Setup Env for Runtime
|
||||||
ENV TORCH_CUDA_ARCH_LIST="12.0;12.1"
|
ENV TORCH_CUDA_ARCH_LIST="12.0;12.1"
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
# syntax=docker/dockerfile:1.6
|
# syntax=docker/dockerfile:1.6
|
||||||
|
|
||||||
FROM nvidia/cuda:13.1.0-devel-ubuntu24.04
|
FROM nvidia/cuda:13.1.1-devel-ubuntu24.04
|
||||||
|
|
||||||
ENV DEBIAN_FRONTEND=noninteractive
|
ENV DEBIAN_FRONTEND=noninteractive
|
||||||
ENV PIP_BREAK_SYSTEM_PACKAGES=1
|
ENV PIP_BREAK_SYSTEM_PACKAGES=1
|
||||||
|
|||||||
@@ -11,7 +11,7 @@ REBUILD_VLLM=false
|
|||||||
COPY_HOSTS=()
|
COPY_HOSTS=()
|
||||||
SSH_USER="$USER"
|
SSH_USER="$USER"
|
||||||
NO_BUILD=false
|
NO_BUILD=false
|
||||||
TRITON_REF="v3.6.0"
|
TRITON_REF="v3.5.1"
|
||||||
VLLM_REF="main"
|
VLLM_REF="main"
|
||||||
TMP_IMAGE=""
|
TMP_IMAGE=""
|
||||||
PARALLEL_COPY=false
|
PARALLEL_COPY=false
|
||||||
|
|||||||
Reference in New Issue
Block a user