Skip to content

Commit 663bb6e

Browse files
committed
Updates artifacts for v0.3.0-rc.1 release
Signed-off-by: Kellen Swain <[email protected]>
1 parent fa463df commit 663bb6e

File tree

3 files changed

+7 -7 lines changed

3 files changed

+7 -7 lines changed

config/charts/inferencepool/values.yaml

+3 -3
Original file line number | Diff line number | Diff line change
@@ -2,9 +2,9 @@ inferenceExtension:
  2 |  2 |   | replicas: 1
  3 |  3 |   | image:
  4 |  4 |   | name: epp
  5 |    | - | hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension
  6 |    | - | tag: main
  7 |    | - | pullPolicy: Always
    |  5 | + | hub: registry.k8s.io/gateway-api-inference-extension
    |  6 | + | tag: v0.3.0-rc.1
    |  7 | + | pullPolicy: IfNotPresent
  8 |  8 |   | extProcPort: 9002
  9 |  9 |   |
 10 | 10 |   | inferencePool:

config/manifests/inferencepool-resources.yaml

+2 -2
Original file line number | Diff line number | Diff line change
@@ -48,8 +48,8 @@ spec:
 48 | 48 |   | terminationGracePeriodSeconds: 130
 49 | 49 |   | containers:
 50 | 50 |   | - name: epp
 51 |    | - | image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/epp:main
 52 |    | - | imagePullPolicy: Always
    | 51 | + | image: registry.k8s.io/gateway-api-inference-extension/epp:v0.3.0-rc.1
    | 52 | + | imagePullPolicy: IfNotPresent
 53 | 53 |   | args:
 54 | 54 |   | - -poolName
 55 | 55 |   | - "vllm-llama3-8b-instruct"

config/manifests/vllm/gpu-deployment.yaml

+2 -2
Original file line number | Diff line number | Diff line change
@@ -14,8 +14,8 @@ spec:
 14 | 14 |   | spec:
 15 | 15 |   | containers:
 16 | 16 |   | - name: vllm
 17 |    | - | image: "vllm/vllm-openai:latest"
 18 |    | - | imagePullPolicy: Always
    | 17 | + | image: "vllm/vllm-openai:v0.8.2"
    | 18 | + | imagePullPolicy: IfNotPresent
 19 | 19 |   | command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
 20 | 20 |   | args:
 21 | 21 |   | - "--model"

0 commit comments

Comments (0)