Skip to content

Commit d90bdce

Browse files
committed
fix: metric reset has no effect
Signed-off-by: nayihz <[email protected]>
1 parent 3d61501 commit d90bdce

File tree

6 files changed

+23
-24
lines changed

6 files changed

+23
-24
lines changed

cmd/bbr/main.go

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -32,8 +32,8 @@ import (
3232
metricsserver "sigs.k8s.io/controller-runtime/pkg/metrics/server"
3333

3434
"sigs.k8s.io/gateway-api-inference-extension/internal/runnable"
35+
"sigs.k8s.io/gateway-api-inference-extension/pkg/bbr/metrics"
3536
runserver "sigs.k8s.io/gateway-api-inference-extension/pkg/bbr/server"
36-
"sigs.k8s.io/gateway-api-inference-extension/pkg/epp/metrics"
3737
"sigs.k8s.io/gateway-api-inference-extension/pkg/epp/util/logging"
3838
)
3939

cmd/epp/main.go

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -154,10 +154,6 @@ func run() error {
154154
return err
155155
}
156156

157-
poolNamespacedName := types.NamespacedName{
158-
Name: *poolName,
159-
Namespace: *poolNamespace,
160-
}
161157
metrics.Register()
162158
// Register metrics handler.
163159
// Metrics endpoint is enabled in 'config/default/kustomization.yaml'. The Metrics options configure the server.
@@ -169,6 +165,10 @@ func run() error {
169165
FilterProvider: filters.WithAuthenticationAndAuthorization,
170166
}
171167

168+
poolNamespacedName := types.NamespacedName{
169+
Name: *poolName,
170+
Namespace: *poolNamespace,
171+
}
172172
mgr, err := runserver.NewDefaultManager(poolNamespacedName, cfg, metricsServerOptions)
173173
if err != nil {
174174
setupLog.Error(err, "Failed to create controller manager")

pkg/epp/metrics/metrics.go

Lines changed: 14 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -309,20 +309,20 @@ func Register() {
309309
}
310310

311311
// Just for integration test
312-
func Unregister() {
313-
metrics.Registry.Unregister(requestCounter)
314-
metrics.Registry.Unregister(requestErrCounter)
315-
metrics.Registry.Unregister(requestLatencies)
316-
metrics.Registry.Unregister(requestSizes)
317-
metrics.Registry.Unregister(responseSizes)
318-
metrics.Registry.Unregister(inputTokens)
319-
metrics.Registry.Unregister(outputTokens)
320-
metrics.Registry.Unregister(runningRequests)
321-
metrics.Registry.Unregister(NormalizedTimePerOutputToken)
322-
323-
metrics.Registry.Unregister(inferencePoolAvgKVCache)
324-
metrics.Registry.Unregister(inferencePoolAvgQueueSize)
325-
metrics.Registry.Unregister(inferencePoolReadyPods)
312+
func Reset() {
313+
requestCounter.Reset()
314+
requestErrCounter.Reset()
315+
requestLatencies.Reset()
316+
requestSizes.Reset()
317+
responseSizes.Reset()
318+
inputTokens.Reset()
319+
outputTokens.Reset()
320+
runningRequests.Reset()
321+
NormalizedTimePerOutputToken.Reset()
322+
inferencePoolAvgKVCache.Reset()
323+
inferencePoolAvgQueueSize.Reset()
324+
inferencePoolReadyPods.Reset()
325+
SchedulerPluginProcessingLatencies.Reset()
326326
}
327327

328328
// RecordRequstCounter records the number of requests.

pkg/epp/metrics/testdata/scheduler_e2e_duration_seconds_metric

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# HELP inference_extension_scheduler_e2e_duration_seconds [ALPHA] End-to-end scheduling latency distribution in seconds.
1+
# HELP inference_extension_scheduler_e2e_duration_seconds End-to-end scheduling latency distribution in seconds.
22
# TYPE inference_extension_scheduler_e2e_duration_seconds histogram
33
inference_extension_scheduler_e2e_duration_seconds_bucket{le="0.0001"} 0
44
inference_extension_scheduler_e2e_duration_seconds_bucket{le="0.0002"} 1

pkg/epp/metrics/testdata/scheduler_plugin_processing_latencies_metric

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# HELP inference_extension_scheduler_plugin_duration_seconds [ALPHA] Scheduler plugin processing latency distribution in seconds for each plugin type and plugin name.
1+
# HELP inference_extension_scheduler_plugin_duration_seconds Scheduler plugin processing latency distribution in seconds for each plugin type and plugin name.
22
# TYPE inference_extension_scheduler_plugin_duration_seconds histogram
33
inference_extension_scheduler_plugin_duration_seconds_bucket{plugin_name="PluginA",plugin_type="PreSchedule",le="0.0001"} 0
44
inference_extension_scheduler_plugin_duration_seconds_bucket{plugin_name="PluginA",plugin_type="PreSchedule",le="0.0002"} 0

test/integration/epp/hermetic_test.go

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1258,7 +1258,6 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
12581258

12591259
for _, test := range tests {
12601260
t.Run(test.name, func(t *testing.T) {
1261-
metrics.Register()
12621261
client, cleanup := setUpHermeticServer(t, test.pods, true)
12631262
t.Cleanup(cleanup)
12641263
responses, err := integrationutils.StreamedRequest(t, client, test.requests, len(test.wantResponses))
@@ -1277,9 +1276,8 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
12771276
}
12781277
}
12791278
}
1280-
metrics.Unregister()
1279+
metrics.Reset()
12811280
})
1282-
return
12831281
}
12841282
}
12851283

@@ -1394,6 +1392,7 @@ func BeforeSuite() func() {
13941392
// Init runtime.
13951393
ctrl.SetLogger(logger)
13961394

1395+
metrics.Register()
13971396
// Register metrics handler.
13981397
// Metrics endpoint is enabled in 'config/default/kustomization.yaml'. The Metrics options configure the server.
13991398
// More info:

0 commit comments

Comments
 (0)