Files
edge-gitops/clusters/k3s-dgx/apps/huihui-granite-inference.yaml
2026-05-05 14:01:20 -05:00

19 lines
405 B
YAML

---
# KServe InferenceService "flower-sample" in the "kserve" namespace.
# Declares a predictor for a TensorFlow-format model whose artifacts are
# read from the GCS URI given in storageUri.
#
# NOTE(review): the file path refers to "huihui-granite-inference", but this
# manifest deploys the "flower-sample" TensorFlow example - confirm that this
# is the intended workload for this file.
apiVersion: "serving.kserve.io/v1beta1"
kind: "InferenceService"
metadata:
  name: "flower-sample"
  namespace: kserve
spec:
  predictor:
    model:
      # The model format is what KServe uses to choose a serving runtime.
      modelFormat:
        name: tensorflow
      storageUri: "gs://kfserving-examples/models/tensorflow/flowers"
      # Resource requests and limits for the model server container.
      # Quantities are quoted so they are always read as strings.
      resources:
        requests:
          cpu: "100m"
          memory: "256Mi"
        limits:
          cpu: "1"
          memory: "1Gi"