File tree 7 files changed +9
-15
lines changed
config/charts/inferencepool
7 files changed +9
-15
lines changed Original file line number Diff line number Diff line change 1
- InferencePool {{ .Values.inferencePool.name }} deployed.
1
+ InferencePool {{ .Release.Name }} deployed.
Original file line number Diff line number Diff line change @@ -12,7 +12,7 @@ app.kubernetes.io/version: {{ .Chart.AppVersion | quote }}
12
12
Inference extension name
13
13
*/}}
14
14
{{- define "gateway-api-inference-extension.name" -}}
15
- {{- $base := .Values.inferencePool.name | default "default-pool" | lower | trim | trunc 40 -}}
15
+ {{- $base := .Release.Name | default "default-pool" | lower | trim | trunc 40 -}}
16
16
{{ $base }}-epp
17
17
{{- end -}}
18
18
Original file line number Diff line number Diff line change 2
2
common validations
3
3
*/}}
4
4
{{- define "gateway-api-inference-extension.validations.inferencepool.common" -}}
5
- {{- if not $.Values.inferencePool.name }}
6
- {{- fail "missing .Values.inferencePool.name" }}
7
- {{- end }}
8
-
9
-
10
5
{{- if or (empty $.Values.inferencePool.modelServers) (not $.Values.inferencePool.modelServers.matchLabels) }}
11
6
{{- fail ".Values.inferencePool.modelServers.matchLabels is required" }}
12
7
{{- end }}
Original file line number Diff line number Diff line change 22
22
imagePullPolicy : {{ .Values.inferenceExtension.image.pullPolicy | default "Always" }}
23
23
args :
24
24
- -poolName
25
- - {{ .Values.inferencePool.name }}
25
+ - {{ .Release.Name }}
26
26
- -poolNamespace
27
27
- {{ .Release.Namespace }}
28
28
- -v
Original file line number Diff line number Diff line change 3
3
kind : HealthCheckPolicy
4
4
apiVersion : networking.gke.io/v1
5
5
metadata :
6
- name : {{ .Values.inferencePool.name }}
6
+ name : {{ .Release.Name }}
7
7
namespace : {{ .Release.Namespace }}
8
8
labels :
9
9
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
10
10
spec :
11
11
targetRef :
12
12
group: "inference.networking.x-k8s.io"
13
13
kind : InferencePool
14
- name : {{ .Values.inferencePool.name }}
14
+ name : {{ .Release.Name }}
15
15
default :
16
16
config :
17
17
type : HTTP
@@ -22,22 +22,22 @@ spec:
22
22
apiVersion : networking.gke.io/v1
23
23
kind : GCPBackendPolicy
24
24
metadata :
25
- name : {{ .Values.inferencePool.name }}
25
+ name : {{ .Release.Name }}
26
26
namespace : {{ .Release.Namespace }}
27
27
labels :
28
28
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
29
29
spec :
30
30
targetRef :
31
31
group: "inference.networking.x-k8s.io"
32
32
kind : InferencePool
33
- name : {{ .Values.inferencePool.name }}
33
+ name : {{ .Release.Name }}
34
34
default :
35
35
timeoutSec : 300 # 5-minute timeout (adjust as needed)
36
36
---
37
37
apiVersion : monitoring.googleapis.com/v1
38
38
kind : ClusterPodMonitoring
39
39
metadata :
40
- name : {{ .Release.Namespace }}-{{ .Values.inferencePool.name }}
40
+ name : {{ .Release.Namespace }}-{{ .Release.Name }}
41
41
labels :
42
42
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
43
43
spec :
Original file line number Diff line number Diff line change 2
2
apiVersion : inference.networking.x-k8s.io/v1alpha2
3
3
kind : InferencePool
4
4
metadata :
5
- name : {{ .Values.inferencePool.name }}
5
+ name : {{ .Release.Name }}
6
6
namespace : {{ .Release.Namespace }}
7
7
labels :
8
8
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
Original file line number Diff line number Diff line change @@ -8,7 +8,6 @@ inferenceExtension:
8
8
extProcPort : 9002
9
9
10
10
inferencePool :
11
- # name: pool-1 # REQUIRED
12
11
targetPortNumber : 8000
13
12
# modelServers: # REQUIRED
14
13
# matchLabels:
You can’t perform that action at this time.
0 commit comments