Skip to content

Commit 8c4eb46

Browse files
committed
feat: add vllm simulator deployment
Signed-off-by: Shane Utt <[email protected]>
1 parent 6d12b06 commit 8c4eb46

File tree

3 files changed

+141
-0
lines changed

3 files changed

+141
-0
lines changed
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,86 @@
# Deployment for one vLLM simulator instance. The container is started with
# --port=30801, --model=model1 and --lora=lora1,lora2 (see `args` below).
apiVersion: apps/v1
kind: Deployment
metadata:
  name: vllm-30801
  labels:
    app: vllm-30801
spec:
  replicas: 1
  selector:
    matchLabels:
      # Must equal the `app` label on the pod template below.
      app: vllm-30801
  template:
    metadata:
      labels:
        app: vllm-30801
        # Label values must be strings, so the quotes are required here;
        # a bare `true` would be parsed as a YAML boolean.
        ai-aware-router-pod: "true"
      annotations:
        # host:port value, quoted so it is unambiguously a string.
        # NOTE(review): presumably consumed by the AI-aware router to reach
        # this pod - confirm against the router's configuration.
        ai-aware-router-address: "127.0.0.1:30801"
    spec:
      containers:
        - name: vllm
          # The Kustomization added in the same commit has an `images` entry
          # for vllm-sim/vllm-sim that overrides this tag at build time.
          image: vllm-sim/vllm-sim:latest
          args:
            # Keep the port in sync with `containerPort` below.
            - "--port=30801"
            - "--model=model1"
            - "--lora=lora1,lora2"
          ports:
            - containerPort: 30801
---
# Deployment for one vLLM simulator instance. The container is started with
# --port=30802, --model=model1 and --lora=lora1,lora2 (see `args` below).
apiVersion: apps/v1
kind: Deployment
metadata:
  name: vllm-30802
  labels:
    app: vllm-30802
spec:
  replicas: 1
  selector:
    matchLabels:
      # Must equal the `app` label on the pod template below.
      app: vllm-30802
  template:
    metadata:
      labels:
        app: vllm-30802
        # Label values must be strings, so the quotes are required here;
        # a bare `true` would be parsed as a YAML boolean.
        ai-aware-router-pod: "true"
      annotations:
        # host:port value, quoted so it is unambiguously a string.
        # NOTE(review): presumably consumed by the AI-aware router to reach
        # this pod - confirm against the router's configuration.
        ai-aware-router-address: "127.0.0.1:30802"
    spec:
      containers:
        - name: vllm
          # The Kustomization added in the same commit has an `images` entry
          # for vllm-sim/vllm-sim that overrides this tag at build time.
          image: vllm-sim/vllm-sim:latest
          args:
            # Keep the port in sync with `containerPort` below.
            - "--port=30802"
            - "--model=model1"
            - "--lora=lora1,lora2"
          ports:
            - containerPort: 30802
---
# Deployment for one vLLM simulator instance. The container is started with
# --port=30803, --model=model2 and --lora=lora3 (see `args` below), i.e. a
# different model/adapter set than the 30801 and 30802 instances.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: vllm-30803
  labels:
    app: vllm-30803
spec:
  replicas: 1
  selector:
    matchLabels:
      # Must equal the `app` label on the pod template below.
      app: vllm-30803
  template:
    metadata:
      labels:
        app: vllm-30803
        # Label values must be strings, so the quotes are required here;
        # a bare `true` would be parsed as a YAML boolean.
        ai-aware-router-pod: "true"
      annotations:
        # host:port value, quoted so it is unambiguously a string.
        # NOTE(review): presumably consumed by the AI-aware router to reach
        # this pod - confirm against the router's configuration.
        ai-aware-router-address: "127.0.0.1:30803"
    spec:
      containers:
        - name: vllm
          # The Kustomization added in the same commit has an `images` entry
          # for vllm-sim/vllm-sim that overrides this tag at build time.
          image: vllm-sim/vllm-sim:latest
          args:
            # Keep the port in sync with `containerPort` below.
            - "--port=30803"
            - "--model=model2"
            - "--lora=lora3"
          ports:
            - containerPort: 30803
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,17 @@
# ------------------------------------------------------------------------------
# VLLM Simulator
#
# This deploys a VLLM simulator which can be used to simulate inference for
# small environments (e.g. Kubernetes In Docker (KIND) clusters) or for simple
# tests.
# ------------------------------------------------------------------------------
apiVersion: kustomize.config.k8s.io/v1beta1
kind: Kustomization

# Manifests assembled by this Kustomization (paths relative to this file).
resources:
  - deployments.yaml
  - services.yaml

# Rewrites the tag of every container image named vllm-sim/vllm-sim in the
# resources above.
images:
  - name: vllm-sim/vllm-sim
    # Quoted on purpose: the tag is a string, and a future two-part version
    # such as 1.0 would otherwise be parsed as a float.
    newTag: "0.0.2"
+38
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,38 @@
# ClusterIP Service that forwards TCP port 30801 to port 30801 on pods
# labelled `app: vllm-30801`.
apiVersion: v1
kind: Service
metadata:
  name: vllm-30801
spec:
  type: ClusterIP
  selector:
    # Selects the pods created by the Deployment of the same name.
    app: vllm-30801
  ports:
    - protocol: TCP
      # `port` is the Service port; `targetPort` is the container port.
      port: 30801
      targetPort: 30801
---
# ClusterIP Service that forwards TCP port 30802 to port 30802 on pods
# labelled `app: vllm-30802`.
apiVersion: v1
kind: Service
metadata:
  name: vllm-30802
spec:
  type: ClusterIP
  selector:
    # Selects the pods created by the Deployment of the same name.
    app: vllm-30802
  ports:
    - protocol: TCP
      # `port` is the Service port; `targetPort` is the container port.
      port: 30802
      targetPort: 30802
---
# ClusterIP Service that forwards TCP port 30803 to port 30803 on pods
# labelled `app: vllm-30803`.
apiVersion: v1
kind: Service
metadata:
  name: vllm-30803
spec:
  type: ClusterIP
  selector:
    # Selects the pods created by the Deployment of the same name.
    app: vllm-30803
  ports:
    - protocol: TCP
      # `port` is the Service port; `targetPort` is the container port.
      port: 30803
      targetPort: 30803

0 commit comments

Comments
 (0)