Some optimizations

This commit is contained in:
Eugene Rakhmatulin
2026-01-29 22:08:05 -08:00
parent a5b693cc1e
commit 0ac438b4dd
3 changed files with 39 additions and 8 deletions

View File

@@ -258,7 +258,8 @@ RUN mkdir -p tiktoken_encodings && \
# No need to copy source code, as it's already in the site-packages
# Install the prebuilt wheels directly from the builder stage via a bind mount.
# A COPY followed by `rm -rf` in a later RUN would still ship the wheel files
# inside the COPY layer, so the cleanup would not reduce the image size; with a
# bind mount the wheel files are never written into any layer of this image.
# The uv cache mount is kept so repeated builds reuse downloaded dependencies.
RUN --mount=type=bind,from=builder,source=/workspace/wheels,target=/workspace/wheels \
    --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
    uv pip install /workspace/wheels/*.whl
# Setup Env for Runtime
# ENV persists into the running container, not just the build.
# NOTE(review): presumably limits the CUDA architectures targeted by PyTorch
# extension builds to compute capabilities 12.0 and 12.1 — confirm against the
# GPUs this image is meant to run on.
ENV TORCH_CUDA_ARCH_LIST="12.0;12.1"
@@ -274,3 +275,4 @@ RUN chmod +x $VLLM_BASE_DIR/run-cluster-node.sh
# Final extra deps
RUN --mount=type=cache,id=uv-cache,target=/root/.cache/uv \
uv pip install ray[default] fastsafetensors