set probes

This commit is contained in:
2026-05-07 16:16:21 -05:00
parent 64abcb1483
commit a092b6ffa5

View File

@@ -52,7 +52,9 @@ spec:
repository: vllm/vllm-openai repository: vllm/vllm-openai
tag: v0.19.1-cu130 tag: v0.19.1-cu130
pullPolicy: IfNotPresent pullPolicy: IfNotPresent
env:
  # Point vLLM's cache root at a directory under /model-store.
  # NOTE(review): presumably /model-store is a persistent volume mount so the
  # cache survives pod restarts - confirm against the storage section.
  - name: VLLM_CACHE_ROOT
    value: '/model-store/vllm-cache'
command: command:
- python3 - python3
args: args:
@@ -91,6 +93,32 @@ spec:
resources: resources:
limits: limits:
nvidia.com/gpu: 1 nvidia.com/gpu: 1
# Health probes: all three issue GET /health on port 8000.
# While the startupProbe has not yet succeeded, Kubernetes holds back the
# liveness and readiness probes, so the slow-start budget lives in the
# startupProbe alone.
# NOTE(review): assumes these mappings are passed through as core/v1 Probe
# objects; some operators nest the probe under an extra key - confirm against
# the schema of the resource this manifest targets.
livenessProbe:
  httpGet:
    path: /health
    port: 8000
  # No initialDelaySeconds: with a startupProbe defined, the delay would only
  # begin counting after startup has already succeeded, leaving a freshly
  # started server unmonitored for no benefit.
  periodSeconds: 30
  timeoutSeconds: 10
  # Restart the container after 10 consecutive failures (10 x 30s = 5 min).
  failureThreshold: 10
readinessProbe:
  httpGet:
    path: /health
    port: 8000
  # No initialDelaySeconds: the server is already answering /health once the
  # startupProbe passes, so it can receive traffic on the first success.
  periodSeconds: 15
  timeoutSeconds: 10
  # Remove the pod from Service endpoints after 3 consecutive failures (45s),
  # well before the liveness probe would restart it. The previous value of 20
  # (20 x 15s = 5 min) matched the liveness budget, so an unhealthy pod kept
  # receiving traffic until it was restarted.
  failureThreshold: 3
startupProbe:
  httpGet:
    path: /health
    port: 8000
  initialDelaySeconds: 10
  periodSeconds: 20
  timeoutSeconds: 10
  # Startup budget: 10s + 60 x 20s = roughly 20 min before the container is
  # considered failed.
  failureThreshold: 60
expose: expose:
service: service:
type: ClusterIP type: ClusterIP