add class back
This commit is contained in:
@@ -1,18 +1,22 @@
|
|||||||
apiVersion: "serving.kserve.io/v1beta1"
|
apiVersion: serving.kserve.io/v1beta1
|
||||||
kind: "InferenceService"
|
kind: InferenceService
|
||||||
metadata:
|
metadata:
|
||||||
name: "flower-sample"
|
name: huihui-granite
|
||||||
namespace: kserve
|
namespace: kserve
|
||||||
spec:
|
spec:
|
||||||
predictor:
|
predictor:
|
||||||
model:
|
model:
|
||||||
modelFormat:
|
modelFormat:
|
||||||
name: tensorflow
|
name: huggingface
|
||||||
storageUri: "gs://kfserving-examples/models/tensorflow/flowers"
|
args:
|
||||||
|
- --model_name=huihui-granite
|
||||||
|
storageUri: "hf://huihui-ai/Huihui-granite-4.1-30b-abliterated"
|
||||||
resources:
|
resources:
|
||||||
requests:
|
|
||||||
cpu: "100m"
|
|
||||||
memory: "256Mi"
|
|
||||||
limits:
|
limits:
|
||||||
cpu: "1"
|
cpu: "4"
|
||||||
memory: "1Gi"
|
memory: 16Gi
|
||||||
|
nvidia.com/gpu: "1"
|
||||||
|
requests:
|
||||||
|
cpu: "2"
|
||||||
|
memory: 8Gi
|
||||||
|
nvidia.com/gpu: "1"
|
||||||
|
|||||||
@@ -3,4 +3,4 @@ kind: Kustomization
|
|||||||
resources:
|
resources:
|
||||||
- cert-manager.yaml
|
- cert-manager.yaml
|
||||||
- envoy-gateway-system.yaml
|
- envoy-gateway-system.yaml
|
||||||
# - envoy-gateway-class.yaml
|
- envoy-gateway-class.yaml
|
||||||
|
|||||||
@@ -4,5 +4,5 @@ resources:
|
|||||||
- flux-system
|
- flux-system
|
||||||
- gpu-support
|
- gpu-support
|
||||||
- infrastructure
|
- infrastructure
|
||||||
# - kserve
|
- kserve
|
||||||
# - apps
|
# - apps
|
||||||
|
|||||||
Reference in New Issue
Block a user