Skip to content

Commit 4e76473

Browse files
committed
chore: split kind environments into kgateway and istio based
Signed-off-by: Shane Utt <[email protected]>
1 parent cfea47b commit 4e76473

10 files changed

+97
-2
lines changed
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
# **WARNING** Only use in testing scenarios: this rule skips TLS certificate verification (insecureSkipVerify).
2+
apiVersion: networking.istio.io/v1
3+
kind: DestinationRule
4+
metadata:
5+
name: endpoint-picker-insecure-tls
6+
spec:
7+
host: endpoint-picker
8+
trafficPolicy:
9+
tls:
10+
mode: SIMPLE
11+
insecureSkipVerify: true
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,24 @@
1+
# ------------------------------------------------------------------------------
2+
# Kubernetes In Docker (KIND) Environment
3+
#
4+
# This will deploy the full development stack on a KIND cluster:
5+
#
6+
# * Istio Control Plane
7+
# * VLLM Simulator
8+
# * Inference Gateway
9+
#
10+
# This will expose the VLLM simulator via an InferencePool and an HTTPRoute.
11+
# ------------------------------------------------------------------------------
12+
apiVersion: kustomize.config.k8s.io/v1beta1
13+
kind: Kustomization
14+
15+
resources:
16+
- destination-rules.yaml
17+
- services.yaml
18+
- ../../../components/istio-control-plane/
19+
- ../../../components/vllm-sim/
20+
- ../../../components/inference-gateway/
21+
22+
patches:
23+
- path: patch-deployments.yaml
24+
- path: patch-gateways.yaml
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,10 @@
1+
apiVersion: gateway.networking.k8s.io/v1
2+
kind: Gateway
3+
metadata:
4+
name: inference-gateway
5+
labels:
6+
istio.io/enable-inference-extproc: "true"
7+
annotations:
8+
networking.istio.io/service-type: ClusterIP
9+
spec:
10+
gatewayClassName: istio

deploy/environments/dev/kind/kustomization.yaml renamed to deploy/environments/dev/kind-kgateway/kustomization.yaml

+1-1
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@
33
#
44
# This will deploy the full development stack on a KIND cluster:
55
#
6-
# * Istio Control Plane
6+
# * KGateway Control Plane
77
# * VLLM Simulator
88
# * Inference Gateway
99
#
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,22 @@
1+
apiVersion: apps/v1
2+
kind: Deployment
3+
metadata:
4+
name: endpoint-picker
5+
spec:
6+
template:
7+
spec:
8+
containers:
9+
- name: epp
10+
args:
11+
- -poolName
12+
- "vllm-llama3-8b-instruct"
13+
- -poolNamespace
14+
- "default"
15+
- -v
16+
- "5"
17+
- --zap-encoder
18+
- "json"
19+
- -grpcPort
20+
- "9002"
21+
- -grpcHealthPort
22+
- "9003"
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,28 @@
1+
apiVersion: v1
2+
kind: Service
3+
metadata:
4+
annotations:
5+
networking.istio.io/service-type: NodePort
6+
labels:
7+
gateway.istio.io/managed: istio.io-gateway-controller
8+
gateway.networking.k8s.io/gateway-name: inference-gateway
9+
istio.io/enable-inference-extproc: "true"
10+
name: inference-gateway-istio
11+
namespace: default
12+
spec:
13+
type: NodePort
14+
selector:
15+
gateway.networking.k8s.io/gateway-name: inference-gateway
16+
ports:
17+
- appProtocol: tcp
18+
name: status-port
19+
port: 15021
20+
protocol: TCP
21+
targetPort: 15021
22+
nodePort: 32021
23+
- appProtocol: http
24+
name: default
25+
port: 80
26+
protocol: TCP
27+
targetPort: 80
28+
nodePort: 30080

scripts/kind-dev-env.sh

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
#!/bin/bash
22

3-
# This shell script deploys a kind cluster with an Istio-based Gateway API
3+
# This shell script deploys a kind cluster with a KGateway-based Gateway API
44
# implementation fully configured. It deploys the vllm simulator, which it
55
# exposes with a Gateway -> HTTPRoute -> InferencePool. The Gateway is
66
# configured with a filter for the ext_proc endpoint picker.

0 commit comments

Comments
 (0)