From fa463df1b029cad8b0ab284d0b4bff9ec95d2a60 Mon Sep 17 00:00:00 2001 From: Kellen Swain Date: Thu, 24 Apr 2025 13:52:43 -0700 Subject: [PATCH 1/5] Update issue templates --- .github/ISSUE_TEMPLATE/bug_request.md | 4 +++- .github/ISSUE_TEMPLATE/feature_request.md | 3 +-- .github/ISSUE_TEMPLATE/new-release.md | 1 + 3 files changed, 5 insertions(+), 3 deletions(-) diff --git a/.github/ISSUE_TEMPLATE/bug_request.md b/.github/ISSUE_TEMPLATE/bug_request.md index c2597eb3..15ed35e1 100644 --- a/.github/ISSUE_TEMPLATE/bug_request.md +++ b/.github/ISSUE_TEMPLATE/bug_request.md @@ -1,7 +1,9 @@ --- name: Bug Report about: Report a bug you encountered -labels: kind/bug +title: '' +labels: kind/bug, needs-triage +assignees: '' --- diff --git a/.github/ISSUE_TEMPLATE/feature_request.md b/.github/ISSUE_TEMPLATE/feature_request.md index 53a885c7..1eee5871 100644 --- a/.github/ISSUE_TEMPLATE/feature_request.md +++ b/.github/ISSUE_TEMPLATE/feature_request.md @@ -2,7 +2,7 @@ name: Feature request about: Suggest an idea for this project title: '' -labels: '' +labels: needs-triage assignees: '' --- @@ -12,4 +12,3 @@ assignees: '' **What would you like to be added**: **Why is this needed**: - diff --git a/.github/ISSUE_TEMPLATE/new-release.md b/.github/ISSUE_TEMPLATE/new-release.md index be569844..27e83784 100644 --- a/.github/ISSUE_TEMPLATE/new-release.md +++ b/.github/ISSUE_TEMPLATE/new-release.md @@ -4,6 +4,7 @@ about: Propose a new release title: Release v0.x.0 labels: '' assignees: '' + --- - [Introduction](#introduction) From 663bb6ec32a657d54f2d1e981a5c18843a3a9a1e Mon Sep 17 00:00:00 2001 From: Kellen Swain Date: Tue, 1 Apr 2025 01:02:18 +0000 Subject: [PATCH 2/5] Updates artifacts for v0.3.0-rc.1 release Signed-off-by: Kellen Swain --- config/charts/inferencepool/values.yaml | 6 +++--- config/manifests/inferencepool-resources.yaml | 4 ++-- config/manifests/vllm/gpu-deployment.yaml | 4 ++-- 3 files changed, 7 insertions(+), 7 deletions(-) diff --git a/config/charts/inferencepool/values.yaml b/config/charts/inferencepool/values.yaml index bd48f37e..e673d22c 100644 --- a/config/charts/inferencepool/values.yaml +++ b/config/charts/inferencepool/values.yaml @@ -2,9 +2,9 @@ inferenceExtension: replicas: 1 image: name: epp - hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension - tag: main - pullPolicy: Always + hub: registry.k8s.io/gateway-api-inference-extension + tag: v0.3.0-rc.1 + pullPolicy: IfNotPresent extProcPort: 9002 inferencePool: diff --git a/config/manifests/inferencepool-resources.yaml b/config/manifests/inferencepool-resources.yaml index 3d978292..6984ccff 100644 --- a/config/manifests/inferencepool-resources.yaml +++ b/config/manifests/inferencepool-resources.yaml @@ -48,8 +48,8 @@ spec: terminationGracePeriodSeconds: 130 containers: - name: epp - image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/epp:main - imagePullPolicy: Always + image: registry.k8s.io/gateway-api-inference-extension/epp:v0.3.0-rc.1 + imagePullPolicy: IfNotPresent args: - -poolName - "vllm-llama3-8b-instruct" diff --git a/config/manifests/vllm/gpu-deployment.yaml b/config/manifests/vllm/gpu-deployment.yaml index 16f93882..1c06e440 100644 --- a/config/manifests/vllm/gpu-deployment.yaml +++ b/config/manifests/vllm/gpu-deployment.yaml @@ -14,8 +14,8 @@ spec: spec: containers: - name: vllm - image: "vllm/vllm-openai:latest" - imagePullPolicy: Always + image: "vllm/vllm-openai:v0.8.2" + imagePullPolicy: IfNotPresent command: ["python3", "-m", "vllm.entrypoints.openai.api_server"] args: - "--model" From dd040fb8a4abdf78bc0a6029af5eee6ae65c9332 Mon Sep 17 00:00:00 2001 From: Kellen Swain Date: Tue, 1 Apr 2025 03:00:49 +0000 Subject: [PATCH 3/5] Updates bbr chart for v0.3.0-rc.1 release Signed-off-by: Kellen Swain --- config/charts/body-based-routing/values.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/config/charts/body-based-routing/values.yaml b/config/charts/body-based-routing/values.yaml index 0b88dc43..0bc9abda 100644 --- a/config/charts/body-based-routing/values.yaml +++ b/config/charts/body-based-routing/values.yaml @@ -3,8 +3,8 @@ bbr: replicas: 1 image: name: bbr - hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension - tag: main + hub: registry.k8s.io/gateway-api-inference-extension + tag: v0.3.0-rc.1 pullPolicy: Always port: 9004 healthCheckPort: 9005 From 48805810444f976f570db9eb145abe7b9bebce2e Mon Sep 17 00:00:00 2001 From: Kellen Swain Date: Wed, 2 Apr 2025 21:48:45 +0000 Subject: [PATCH 4/5] Updates artifacts for v0.3.0 release Signed-off-by: Kellen Swain --- config/charts/body-based-routing/values.yaml | 2 +- config/charts/inferencepool/values.yaml | 2 +- config/manifests/inferencepool-resources.yaml | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/config/charts/body-based-routing/values.yaml b/config/charts/body-based-routing/values.yaml index 0bc9abda..2a507b2a 100644 --- a/config/charts/body-based-routing/values.yaml +++ b/config/charts/body-based-routing/values.yaml @@ -4,7 +4,7 @@ bbr: image: name: bbr hub: registry.k8s.io/gateway-api-inference-extension - tag: v0.3.0-rc.1 + tag: v0.3.0 pullPolicy: Always port: 9004 healthCheckPort: 9005 diff --git a/config/charts/inferencepool/values.yaml b/config/charts/inferencepool/values.yaml index e673d22c..d9b90289 100644 --- a/config/charts/inferencepool/values.yaml +++ b/config/charts/inferencepool/values.yaml @@ -3,7 +3,7 @@ inferenceExtension: image: name: epp hub: registry.k8s.io/gateway-api-inference-extension - tag: v0.3.0-rc.1 + tag: v0.3.0 pullPolicy: IfNotPresent extProcPort: 9002 diff --git a/config/manifests/inferencepool-resources.yaml b/config/manifests/inferencepool-resources.yaml index 6984ccff..e4a42754 100644 --- a/config/manifests/inferencepool-resources.yaml +++ b/config/manifests/inferencepool-resources.yaml @@ -48,7 +48,7 @@ spec: terminationGracePeriodSeconds: 130 containers: - name: epp - image: registry.k8s.io/gateway-api-inference-extension/epp:v0.3.0-rc.1 + image: registry.k8s.io/gateway-api-inference-extension/epp:v0.3.0 imagePullPolicy: IfNotPresent args: - -poolName From dd98e5c648f1cf1df81c798fece40520e8c29385 Mon Sep 17 00:00:00 2001 From: Kellen Swain Date: Thu, 24 Apr 2025 21:01:52 +0000 Subject: [PATCH 5/5] Adding blank issue template so that all issues start with label --- .github/ISSUE_TEMPLATE/issue_template.md | 8 ++++++++ config/charts/body-based-routing/values.yaml | 4 ++-- config/charts/inferencepool/values.yaml | 6 +++--- config/manifests/inferencepool-resources.yaml | 4 ++-- config/manifests/vllm/gpu-deployment.yaml | 4 ++-- 5 files changed, 17 insertions(+), 9 deletions(-) create mode 100644 .github/ISSUE_TEMPLATE/issue_template.md diff --git a/.github/ISSUE_TEMPLATE/issue_template.md b/.github/ISSUE_TEMPLATE/issue_template.md new file mode 100644 index 00000000..1a2c8c6f --- /dev/null +++ b/.github/ISSUE_TEMPLATE/issue_template.md @@ -0,0 +1,8 @@ +--- +name: Blank Issue +about: '' +title: '' +labels: needs-triage +assignees: '' + +--- \ No newline at end of file diff --git a/config/charts/body-based-routing/values.yaml b/config/charts/body-based-routing/values.yaml index 2a507b2a..0b88dc43 100644 --- a/config/charts/body-based-routing/values.yaml +++ b/config/charts/body-based-routing/values.yaml @@ -3,8 +3,8 @@ bbr: replicas: 1 image: name: bbr - hub: registry.k8s.io/gateway-api-inference-extension - tag: v0.3.0 + hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension + tag: main pullPolicy: Always port: 9004 healthCheckPort: 9005 diff --git a/config/charts/inferencepool/values.yaml b/config/charts/inferencepool/values.yaml index d9b90289..bd48f37e 100644 --- a/config/charts/inferencepool/values.yaml +++ b/config/charts/inferencepool/values.yaml @@ -2,9 +2,9 @@ inferenceExtension: replicas: 1 image: name: epp - hub: registry.k8s.io/gateway-api-inference-extension - tag: v0.3.0 - pullPolicy: IfNotPresent + hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension + tag: main + pullPolicy: Always extProcPort: 9002 inferencePool: diff --git a/config/manifests/inferencepool-resources.yaml b/config/manifests/inferencepool-resources.yaml index e4a42754..3d978292 100644 --- a/config/manifests/inferencepool-resources.yaml +++ b/config/manifests/inferencepool-resources.yaml @@ -48,8 +48,8 @@ spec: terminationGracePeriodSeconds: 130 containers: - name: epp - image: registry.k8s.io/gateway-api-inference-extension/epp:v0.3.0 - imagePullPolicy: IfNotPresent + image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/epp:main + imagePullPolicy: Always args: - -poolName - "vllm-llama3-8b-instruct" diff --git a/config/manifests/vllm/gpu-deployment.yaml b/config/manifests/vllm/gpu-deployment.yaml index 1c06e440..16f93882 100644 --- a/config/manifests/vllm/gpu-deployment.yaml +++ b/config/manifests/vllm/gpu-deployment.yaml @@ -14,8 +14,8 @@ spec: spec: containers: - name: vllm - image: "vllm/vllm-openai:v0.8.2" - imagePullPolicy: IfNotPresent + image: "vllm/vllm-openai:latest" + imagePullPolicy: Always command: ["python3", "-m", "vllm.entrypoints.openai.api_server"] args: - "--model"