feat: add vllm simulator deployment

shaneutt · shaneutt · commit 8c4eb46917a8 · 2025-04-16T18:27:44.000-04:00
Signed-off-by: Shane Utt <shaneutt@linux.com>
diff --git a/deploy/components/vllm-sim/deployments.yaml b/deploy/components/vllm-sim/deployments.yaml
@@ -0,0 +1,86 @@
+apiVersion: apps/v1
+kind: Deployment  # one vllm-sim pod; container listens on port 30801
+metadata:
+  name: vllm-30801
+  labels:
+    app: vllm-30801
+spec:
+  replicas: 1
+  selector:
+    matchLabels:
+      app: vllm-30801  # must equal the pod template label below
+  template:
+    metadata:
+      labels:
+        app: vllm-30801
+        ai-aware-router-pod: 'true'  # quoted: label values are strings
+      annotations:
+        ai-aware-router-address: '127.0.0.1:30801'  # quoted: always a string
+    spec:
+      containers:
+      - name: vllm
+        image: vllm-sim/vllm-sim:latest  # tag overridden in kustomization.yaml
+        ports:
+        - containerPort: 30801  # same value as --port below
+        args:
+        - '--port=30801'
+        - '--model=model1'
+        - '--lora=lora1,lora2'
+---
+apiVersion: apps/v1
+kind: Deployment  # one vllm-sim pod; container listens on port 30802
+metadata:
+  name: vllm-30802
+  labels:
+    app: vllm-30802
+spec:
+  replicas: 1
+  selector:
+    matchLabels:
+      app: vllm-30802  # must equal the pod template label below
+  template:
+    metadata:
+      labels:
+        app: vllm-30802
+        ai-aware-router-pod: 'true'  # quoted: label values are strings
+      annotations:
+        ai-aware-router-address: '127.0.0.1:30802'  # quoted: always a string
+    spec:
+      containers:
+      - name: vllm
+        image: vllm-sim/vllm-sim:latest  # tag overridden in kustomization.yaml
+        ports:
+        - containerPort: 30802  # same value as --port below
+        args:
+        - '--port=30802'
+        - '--model=model1'
+        - '--lora=lora1,lora2'
+---
+apiVersion: apps/v1
+kind: Deployment  # one vllm-sim pod; container listens on port 30803
+metadata:
+  name: vllm-30803
+  labels:
+    app: vllm-30803
+spec:
+  replicas: 1
+  selector:
+    matchLabels:
+      app: vllm-30803  # must equal the pod template label below
+  template:
+    metadata:
+      labels:
+        app: vllm-30803
+        ai-aware-router-pod: 'true'  # quoted: label values are strings
+      annotations:
+        ai-aware-router-address: '127.0.0.1:30803'  # quoted: always a string
+    spec:
+      containers:
+      - name: vllm
+        image: vllm-sim/vllm-sim:latest  # tag overridden in kustomization.yaml
+        ports:
+        - containerPort: 30803  # same value as --port below
+        args:
+        - '--port=30803'
+        - '--model=model2'
+        - '--lora=lora3'
diff --git a/deploy/components/vllm-sim/kustomization.yaml b/deploy/components/vllm-sim/kustomization.yaml
@@ -0,0 +1,17 @@
+# ------------------------------------------------------------------------------
+# vLLM Simulator
+#
+# Deploys vLLM simulator instances, which can be used to simulate inference in
+# small environments (e.g. Kubernetes in Docker (KIND) clusters) or in simple
+# tests.
+# ------------------------------------------------------------------------------
+apiVersion: kustomize.config.k8s.io/v1beta1
+kind: Kustomization
+
+resources:  # manifests that make up this component
+- deployments.yaml
+- services.yaml
+
+images:  # pins the simulator image used by the deployments
+- name: vllm-sim/vllm-sim
+  newTag: '0.0.2'  # quoted so a version is never parsed as a number
diff --git a/deploy/components/vllm-sim/services.yaml b/deploy/components/vllm-sim/services.yaml
@@ -0,0 +1,38 @@
+apiVersion: v1
+kind: Service  # cluster-internal endpoint for pods labelled app=vllm-30801
+metadata:
+  name: vllm-30801
+spec:
+  type: ClusterIP
+  selector:
+    app: vllm-30801  # pod label set in deployments.yaml
+  ports:
+  - port: 30801  # port exposed by the Service
+    targetPort: 30801  # containerPort declared in deployments.yaml
+    protocol: TCP
+---
+apiVersion: v1
+kind: Service  # cluster-internal endpoint for pods labelled app=vllm-30802
+metadata:
+  name: vllm-30802
+spec:
+  type: ClusterIP
+  selector:
+    app: vllm-30802  # pod label set in deployments.yaml
+  ports:
+  - port: 30802  # port exposed by the Service
+    targetPort: 30802  # containerPort declared in deployments.yaml
+    protocol: TCP
+---
+apiVersion: v1
+kind: Service  # cluster-internal endpoint for pods labelled app=vllm-30803
+metadata:
+  name: vllm-30803
+spec:
+  type: ClusterIP
+  selector:
+    app: vllm-30803  # pod label set in deployments.yaml
+  ports:
+  - port: 30803  # port exposed by the Service
+    targetPort: 30803  # containerPort declared in deployments.yaml
+    protocol: TCP