test tensorflow

This commit is contained in:
2026-05-05 14:01:20 -05:00
parent b34cf2eee1
commit 467f19f408

View File

@@ -1,22 +1,18 @@
 apiVersion: "serving.kserve.io/v1beta1"
 kind: "InferenceService"
 metadata:
-  name: "qwen-llm"
+  name: "flower-sample"
   namespace: kserve
 spec:
   predictor:
     model:
       modelFormat:
-        name: huggingface
-      args:
-        - --model_name=qwen
-      storageUri: "hf://Qwen/Qwen2.5-0.5B-Instruct"
+        name: tensorflow
+      storageUri: "gs://kfserving-examples/models/tensorflow/flowers"
       resources:
-        limits:
-          cpu: "2"
-          memory: 6Gi
-          nvidia.com/gpu: "1"
         requests:
+          cpu: "100m"
+          memory: "256Mi"
+        limits:
           cpu: "1"
-          memory: 4Gi
-          nvidia.com/gpu: "1"
+          memory: "1Gi"