diff --git a/Dockerfile b/Dockerfile
index 3c19eb8..d8306ce 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -291,6 +291,10 @@ RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
     uv pip install ray[default] fastsafetensors
 
 # Cleanup
+
+# Remove triton-kernels as they are not compatible with this vLLM version yet
+RUN uv pip uninstall triton-kernels
+
 # RUN uv pip uninstall absl-py apex argon2-cffi \
 # argon2-cffi-bindings arrow asttokens astunparse async-lru audioread babel beautifulsoup4 \
 # black bleach comm contourpy cycler datasets debugpy decorator defusedxml dllist dm-tree \
diff --git a/Dockerfile.wheels b/Dockerfile.wheels
index 8311661..d473693 100644
--- a/Dockerfile.wheels
+++ b/Dockerfile.wheels
@@ -95,6 +95,11 @@ ENV TIKTOKEN_ENCODINGS_BASE=$VLLM_BASE_DIR/tiktoken_encodings
 COPY run-cluster-node.sh $VLLM_BASE_DIR/
 RUN chmod +x $VLLM_BASE_DIR/run-cluster-node.sh
 
+# Cleanup
+
+# Remove triton-kernels as they are not compatible with this vLLM version yet
+RUN uv pip uninstall triton-kernels
+
 # Cleanup unneeded packages to reduce image size
 # RUN uv pip uninstall absl-py apex argon2-cffi \
 # argon2-cffi-bindings arrow asttokens astunparse async-lru audioread babel beautifulsoup4 \