File tree 3 files changed +141
-0
lines changed
deploy/components/vllm-sim
3 files changed +141
-0
lines changed Original file line number Diff line number Diff line change
---
# Deployment "vllm-30801": a single replica of the vllm-sim container, started
# with --port=30801, --model=model1 and --lora=lora1,lora2.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: vllm-30801
  labels:
    app: vllm-30801
spec:
  replicas: 1
  selector:
    matchLabels:
      app: vllm-30801
  template:
    metadata:
      labels:
        # Must match spec.selector.matchLabels above.
        app: vllm-30801
        # Label values are strings, so the boolean-looking value stays quoted.
        ai-aware-router-pod: "true"
      annotations:
        # NOTE(review): this is a loopback address; presumably the consumer of
        # this annotation shares the pod's network namespace - confirm.
        ai-aware-router-address: "127.0.0.1:30801"
    spec:
      containers:
        - name: vllm
          # The Kustomization in this component declares an `images` override
          # for vllm-sim/vllm-sim, so `latest` is presumably replaced at build
          # time - verify before applying this manifest directly.
          image: vllm-sim/vllm-sim:latest
          args:
            - "--port=30801"
            - "--model=model1"
            - "--lora=lora1,lora2"
          ports:
            # Same port number as the --port argument above.
            - containerPort: 30801
---
# Deployment "vllm-30802": a single replica of the vllm-sim container, started
# with --port=30802, --model=model1 and --lora=lora1,lora2.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: vllm-30802
  labels:
    app: vllm-30802
spec:
  replicas: 1
  selector:
    matchLabels:
      app: vllm-30802
  template:
    metadata:
      labels:
        # Must match spec.selector.matchLabels above.
        app: vllm-30802
        # Label values are strings, so the boolean-looking value stays quoted.
        ai-aware-router-pod: "true"
      annotations:
        # NOTE(review): this is a loopback address; presumably the consumer of
        # this annotation shares the pod's network namespace - confirm.
        ai-aware-router-address: "127.0.0.1:30802"
    spec:
      containers:
        - name: vllm
          # The Kustomization in this component declares an `images` override
          # for vllm-sim/vllm-sim, so `latest` is presumably replaced at build
          # time - verify before applying this manifest directly.
          image: vllm-sim/vllm-sim:latest
          args:
            - "--port=30802"
            - "--model=model1"
            - "--lora=lora1,lora2"
          ports:
            # Same port number as the --port argument above.
            - containerPort: 30802
---
# Deployment "vllm-30803": a single replica of the vllm-sim container, started
# with --port=30803, --model=model2 and --lora=lora3.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: vllm-30803
  labels:
    app: vllm-30803
spec:
  replicas: 1
  selector:
    matchLabels:
      app: vllm-30803
  template:
    metadata:
      labels:
        # Must match spec.selector.matchLabels above.
        app: vllm-30803
        # Label values are strings, so the boolean-looking value stays quoted.
        ai-aware-router-pod: "true"
      annotations:
        # NOTE(review): this is a loopback address; presumably the consumer of
        # this annotation shares the pod's network namespace - confirm.
        ai-aware-router-address: "127.0.0.1:30803"
    spec:
      containers:
        - name: vllm
          # The Kustomization in this component declares an `images` override
          # for vllm-sim/vllm-sim, so `latest` is presumably replaced at build
          # time - verify before applying this manifest directly.
          image: vllm-sim/vllm-sim:latest
          args:
            - "--port=30803"
            - "--model=model2"
            - "--lora=lora3"
          ports:
            # Same port number as the --port argument above.
            - containerPort: 30803
Original file line number Diff line number Diff line change
---
# ------------------------------------------------------------------------------
# vLLM Simulator
#
# This deploys a vLLM simulator which can be used to simulate inference for
# small environments (e.g. Kubernetes In Docker (KIND) clusters) or for simple
# tests.
# ------------------------------------------------------------------------------
apiVersion: kustomize.config.k8s.io/v1beta1
kind: Kustomization

# Manifests bundled by this kustomization, relative to this directory.
resources:
  - deployments.yaml
  - services.yaml

# Rewrite the tag of every `vllm-sim/vllm-sim` image reference found in the
# resources above. The tag is quoted so it is always read as a string.
images:
  - name: vllm-sim/vllm-sim
    newTag: "0.0.2"
Original file line number Diff line number Diff line change
---
# ClusterIP Service "vllm-30801": exposes TCP port 30801 and forwards it to
# port 30801 on the pods selected by the label app=vllm-30801.
apiVersion: v1
kind: Service
metadata:
  name: vllm-30801
spec:
  type: ClusterIP
  selector:
    app: vllm-30801
  ports:
    - protocol: TCP
      # Port exposed by the Service.
      port: 30801
      # Port on the selected pods that receives the traffic.
      targetPort: 30801
---
# ClusterIP Service "vllm-30802": exposes TCP port 30802 and forwards it to
# port 30802 on the pods selected by the label app=vllm-30802.
apiVersion: v1
kind: Service
metadata:
  name: vllm-30802
spec:
  type: ClusterIP
  selector:
    app: vllm-30802
  ports:
    - protocol: TCP
      # Port exposed by the Service.
      port: 30802
      # Port on the selected pods that receives the traffic.
      targetPort: 30802
---
# ClusterIP Service "vllm-30803": exposes TCP port 30803 and forwards it to
# port 30803 on the pods selected by the label app=vllm-30803.
apiVersion: v1
kind: Service
metadata:
  name: vllm-30803
spec:
  type: ClusterIP
  selector:
    app: vllm-30803
  ports:
    - protocol: TCP
      # Port exposed by the Service.
      port: 30803
      # Port on the selected pods that receives the traffic.
      targetPort: 30803
You can’t perform that action at this time.
0 commit comments