Some optimizations

This commit is contained in:
Eugene Rakhmatulin
2026-01-29 22:08:05 -08:00
parent a5b693cc1e
commit 0ac438b4dd
3 changed files with 39 additions and 8 deletions

View File

@@ -1,6 +1,9 @@
# syntax=docker/dockerfile:1.6
# NOTE(review): the unnamed FROM directly below and the named "AS base" FROM
# further down reference the same image tag. This looks like the before/after
# pair of a diff hunk; confirm that only the named stage belongs in the real file.
FROM nvcr.io/nvidia/pytorch:26.01-py3
# =========================================================
# STAGE 1: Base Image (Installs Dependencies)
# =========================================================
# The stage is named "base" so that it can be referenced by name elsewhere.
FROM nvcr.io/nvidia/pytorch:26.01-py3 AS base
# ENV values apply to every following instruction in this stage and persist in
# the resulting image environment.
# DEBIAN_FRONTEND=noninteractive: presumably to keep apt/debconf from prompting
# during package installs (no apt call is visible in this excerpt - confirm).
ENV DEBIAN_FRONTEND=noninteractive
# PIP_BREAK_SYSTEM_PACKAGES=1: environment form of pip's --break-system-packages
# option, which permits installing into an externally managed system Python.
ENV PIP_BREAK_SYSTEM_PACKAGES=1
@@ -42,7 +45,7 @@ COPY fastsafetensors.patch .
# Install fastsafetensors with uv; the second command line below additionally
# installs ray[default] and constrains apache-tvm-ffi to versions below 0.2.
# The BuildKit cache mount (shared id "uv-cache") exposes /root/.cache/uv during
# this step only, so uv's download cache is reused across builds without being
# written into the image layer.
# NOTE(review): two consecutive `uv pip install` lines follow a single RUN
# continuation. This looks like the old/new pair of a diff hunk; confirm which
# line is current before building.
RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
uv pip install -U fastsafetensors
uv pip install -U fastsafetensors ray[default] "apache-tvm-ffi<0.2"
# --- VLLM SOURCE CACHE BUSTER ---
# Change THIS argument to force a fresh git clone and rebuild of vLLM
@@ -92,7 +95,17 @@ ENV TIKTOKEN_ENCODINGS_BASE=$VLLM_BASE_DIR/tiktoken_encodings
# Copy run-cluster-node.sh from the build context into $VLLM_BASE_DIR and set
# its executable bit.
COPY run-cluster-node.sh $VLLM_BASE_DIR/
RUN chmod +x $VLLM_BASE_DIR/run-cluster-node.sh
# Final extra deps: ray[default], fastsafetensors, and apache-tvm-ffi (pinned
# below 0.2), installed with uv using the shared "uv-cache" cache mount.
# NOTE(review): the same three packages also appear in the fastsafetensors
# install step earlier in this view; check whether this step is still needed.
RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
uv pip install ray[default] fastsafetensors "apache-tvm-ffi<0.2"
# Clean up unneeded packages to reduce image size (currently disabled)
# RUN uv pip uninstall absl-py apex argon2-cffi \
# argon2-cffi-bindings arrow asttokens astunparse async-lru audioread babel beautifulsoup4 \
# black bleach comm contourpy cycler datasets debugpy decorator defusedxml dllist dm-tree \
# execnet executing expecttest fastjsonschema fonttools fqdn gast hypothesis \
# ipykernel ipython ipython_pygments_lexers isoduration isort jedi joblib jupyter-events \
# jupyter-lsp jupyter_client jupyter_core jupyter_server jupyter_server_terminals jupyterlab \
# jupyterlab_code_formatter jupyterlab_pygments jupyterlab_server \
# jupyterlab_tensorboard_pro jupytext kiwisolver matplotlib matplotlib-inline \
# mistune ml_dtypes mock nbclient nbconvert nbformat nest-asyncio notebook notebook_shim \
# opt_einsum optree outlines_core overrides pandas pandocfilters parso pexpect polygraphy pooch \
# pyarrow pycocotools pytest-flakefinder pytest-rerunfailures pytest-shard pytest-xdist \
# scikit-learn scipy Send2Trash soundfile soupsieve soxr spin stack-data \
# wcwidth webcolors xdoctest Werkzeug