From a5416a75f3c1405c4a89d752fda26cc8a05f6930 Mon Sep 17 00:00:00 2001
From: HaimKortovich
Date: Wed, 6 May 2026 16:37:39 -0500
Subject: [PATCH] add gateway and http route

---
Review notes (this section is ignored by git am):
The Gateway listener gains allowedRoutes so that the HTTPRoute in the
nim-service namespace is permitted to attach to a Gateway in default.
Blob ids on the index lines predate these edits, and the indentation of
the llama.yaml context lines was reconstructed; regenerate the patch with
git format-patch against the real tree before relying on either.

 clusters/k3s-dgx/infrastructure/gateway.yaml | 25 +++++++++++++++++++++++++
 clusters/k3s-dgx/nim-service/llama.yaml      | 22 ++++++++++++++++++++++
 2 files changed, 47 insertions(+)
 create mode 100644 clusters/k3s-dgx/infrastructure/gateway.yaml

diff --git a/clusters/k3s-dgx/infrastructure/gateway.yaml b/clusters/k3s-dgx/infrastructure/gateway.yaml
new file mode 100644
index 0000000..7cd386a
--- /dev/null
+++ b/clusters/k3s-dgx/infrastructure/gateway.yaml
@@ -0,0 +1,25 @@
+# Gateway that listens for plain HTTP on port 80 for llm.mycompany.com.
+apiVersion: gateway.networking.k8s.io/v1
+kind: Gateway
+metadata:
+  name: envoy-gateway
+  namespace: default
+spec:
+  gatewayClassName: envoy
+  listeners:
+    - name: http
+      protocol: HTTP
+      port: 80
+      hostname: "llm.mycompany.com"
+      # Listeners only accept routes from the Gateway's own namespace by
+      # default; llm-route lives in nim-service, so allow it explicitly.
+      allowedRoutes:
+        namespaces:
+          from: Selector
+          selector:
+            matchExpressions:
+              - key: kubernetes.io/metadata.name
+                operator: In
+                values:
+                  - default
+                  - nim-service
diff --git a/clusters/k3s-dgx/nim-service/llama.yaml b/clusters/k3s-dgx/nim-service/llama.yaml
index 68d4e42..912f87a 100644
--- a/clusters/k3s-dgx/nim-service/llama.yaml
+++ b/clusters/k3s-dgx/nim-service/llama.yaml
@@ -42,3 +42,25 @@ spec:
     service:
       type: ClusterIP
       port: 8000
+---
+# Forwards all requests for llm.mycompany.com to the
+# meta-llama-3-1-8b-instruct backend on port 8000.
+apiVersion: gateway.networking.k8s.io/v1
+kind: HTTPRoute
+metadata:
+  name: llm-route
+  namespace: nim-service
+spec:
+  parentRefs:
+    - name: envoy-gateway
+      namespace: default
+  hostnames:
+    - "llm.mycompany.com"
+  rules:
+    - matches:
+        - path:
+            type: PathPrefix
+            value: /
+      backendRefs:
+        - name: meta-llama-3-1-8b-instruct
+          port: 8000