From 91164af48734723a474d3070a495b7590db499a1 Mon Sep 17 00:00:00 2001 From: Abhishek Malvankar Date: Mon, 6 Apr 2026 21:43:48 -0400 Subject: [PATCH] satv2: hack fix to bypass namespace isolation in the Prometheus dispatch-rate query --- internal/collector/registration/queueing_model.go | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/internal/collector/registration/queueing_model.go b/internal/collector/registration/queueing_model.go index 8f93d2398..93e4efe80 100644 --- a/internal/collector/registration/queueing_model.go +++ b/internal/collector/registration/queueing_model.go @@ -39,7 +39,9 @@ func RegisterQueueingModelQueries(sourceRegistry *source.SourceRegistry) { Name: QuerySchedulerDispatchRate, Type: source.QueryTypePromQL, Template: `sum by (pod_name, namespace) (rate(inference_extension_scheduler_attempts_total{status="success",namespace="{{.namespace}}",target_model_name="{{.modelID}}"}[1m]))` + - ` or sum by (pod_name, namespace) (rate(inference_extension_scheduler_attempts_total{status="success",namespace="{{.namespace}}",model_name="{{.modelID}}",target_model_name=""}[1m]))`, + ` or sum by (pod_name, namespace) (rate(inference_extension_scheduler_attempts_total{status="success",namespace="{{.namespace}}",model_name="{{.modelID}}",target_model_name=""}[1m]))` + + ` or sum by (pod_name) (rate(inference_extension_scheduler_attempts_total{status="success",target_model_name="{{.modelID}}"}[1m]))` + + ` or sum by (pod_name) (rate(inference_extension_scheduler_attempts_total{status="success",model_name="{{.modelID}}",target_model_name=""}[1m]))`, Params: []string{source.ParamNamespace, source.ParamModelID}, Description: "Request dispatch rate per endpoint (requests/sec) from scheduler, " + "representing the arrival rate to each replica for a specific model",