Skip to content

Commit e8973c9

Browse files
committed
fix: metric reset has no effect
Signed-off-by: nayihz <[email protected]>
1 parent 9306c97 commit e8973c9

File tree

6 files changed

+23
-24
lines changed

6 files changed

+23
-24
lines changed

cmd/bbr/main.go

+1-1
Original file line numberDiff line numberDiff line change
@@ -32,8 +32,8 @@ import (
3232
metricsserver "sigs.k8s.io/controller-runtime/pkg/metrics/server"
3333

3434
"sigs.k8s.io/gateway-api-inference-extension/internal/runnable"
35+
"sigs.k8s.io/gateway-api-inference-extension/pkg/bbr/metrics"
3536
runserver "sigs.k8s.io/gateway-api-inference-extension/pkg/bbr/server"
36-
"sigs.k8s.io/gateway-api-inference-extension/pkg/epp/metrics"
3737
"sigs.k8s.io/gateway-api-inference-extension/pkg/epp/util/logging"
3838
)
3939

cmd/epp/main.go

+4-4
Original file line numberDiff line numberDiff line change
@@ -133,10 +133,6 @@ func run() error {
133133
return err
134134
}
135135

136-
poolNamespacedName := types.NamespacedName{
137-
Name: *poolName,
138-
Namespace: *poolNamespace,
139-
}
140136
metrics.Register()
141137
// Register metrics handler.
142138
// Metrics endpoint is enabled in 'config/default/kustomization.yaml'. The Metrics options configure the server.
@@ -148,6 +144,10 @@ func run() error {
148144
FilterProvider: filters.WithAuthenticationAndAuthorization,
149145
}
150146

147+
poolNamespacedName := types.NamespacedName{
148+
Name: *poolName,
149+
Namespace: *poolNamespace,
150+
}
151151
mgr, err := runserver.NewDefaultManager(poolNamespacedName, cfg, metricsServerOptions)
152152
if err != nil {
153153
setupLog.Error(err, "Failed to create controller manager")

pkg/epp/metrics/metrics.go

+14-14
Original file line numberDiff line numberDiff line change
@@ -234,20 +234,20 @@ func Register() {
234234
}
235235

236236
// Just for integration tests.
237-
func Unregister() {
238-
metrics.Registry.Unregister(requestCounter)
239-
metrics.Registry.Unregister(requestErrCounter)
240-
metrics.Registry.Unregister(requestLatencies)
241-
metrics.Registry.Unregister(requestSizes)
242-
metrics.Registry.Unregister(responseSizes)
243-
metrics.Registry.Unregister(inputTokens)
244-
metrics.Registry.Unregister(outputTokens)
245-
metrics.Registry.Unregister(runningRequests)
246-
metrics.Registry.Unregister(NormalizedTimePerOutputToken)
247-
248-
metrics.Registry.Unregister(inferencePoolAvgKVCache)
249-
metrics.Registry.Unregister(inferencePoolAvgQueueSize)
250-
metrics.Registry.Unregister(inferencePoolReadyPods)
237+
func Reset() {
238+
requestCounter.Reset()
239+
requestErrCounter.Reset()
240+
requestLatencies.Reset()
241+
requestSizes.Reset()
242+
responseSizes.Reset()
243+
inputTokens.Reset()
244+
outputTokens.Reset()
245+
runningRequests.Reset()
246+
NormalizedTimePerOutputToken.Reset()
247+
inferencePoolAvgKVCache.Reset()
248+
inferencePoolAvgQueueSize.Reset()
249+
inferencePoolReadyPods.Reset()
250+
SchedulerPluginProcessingLatencies.Reset()
251251
}
252252

253253
// RecordRequestCounter records the number of requests.

pkg/epp/metrics/testdata/scheduler_e2e_duration_seconds_metric

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# HELP inference_extension_scheduler_e2e_duration_seconds [ALPHA] End-to-end scheduling latency distribution in seconds.
1+
# HELP inference_extension_scheduler_e2e_duration_seconds End-to-end scheduling latency distribution in seconds.
22
# TYPE inference_extension_scheduler_e2e_duration_seconds histogram
33
inference_extension_scheduler_e2e_duration_seconds_bucket{le="0.0001"} 0
44
inference_extension_scheduler_e2e_duration_seconds_bucket{le="0.0002"} 1

pkg/epp/metrics/testdata/scheduler_plugin_processing_latencies_metric

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# HELP inference_extension_scheduler_plugin_duration_seconds [ALPHA] Scheduler plugin processing latency distribution in seconds for each plugin type and plugin name.
1+
# HELP inference_extension_scheduler_plugin_duration_seconds Scheduler plugin processing latency distribution in seconds for each plugin type and plugin name.
22
# TYPE inference_extension_scheduler_plugin_duration_seconds histogram
33
inference_extension_scheduler_plugin_duration_seconds_bucket{plugin_name="PluginA",plugin_type="PreSchedule",le="0.0001"} 0
44
inference_extension_scheduler_plugin_duration_seconds_bucket{plugin_name="PluginA",plugin_type="PreSchedule",le="0.0002"} 0

test/integration/epp/hermetic_test.go

+2-3
Original file line numberDiff line numberDiff line change
@@ -1198,7 +1198,6 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
11981198

11991199
for _, test := range tests {
12001200
t.Run(test.name, func(t *testing.T) {
1201-
metrics.Register()
12021201
client, cleanup := setUpHermeticServer(t, test.pods, true)
12031202
t.Cleanup(cleanup)
12041203
responses, err := integrationutils.StreamedRequest(t, client, test.requests, len(test.wantResponses))
@@ -1217,9 +1216,8 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
12171216
}
12181217
}
12191218
}
1220-
metrics.Unregister()
1219+
metrics.Reset()
12211220
})
1222-
return
12231221
}
12241222
}
12251223

@@ -1334,6 +1332,7 @@ func BeforeSuite() func() {
13341332
// Init runtime.
13351333
ctrl.SetLogger(logger)
13361334

1335+
metrics.Register()
13371336
// Register metrics handler.
13381337
// Metrics endpoint is enabled in 'config/default/kustomization.yaml'. The Metrics options configure the server.
13391338
// More info:

0 commit comments

Comments
 (0)