diff --git a/acm/odh-core/acm-observability/files/uwl_metrics_list.yaml b/acm/odh-core/acm-observability/files/uwl_metrics_list.yaml index 49bf7d52..1081efb9 100644 --- a/acm/odh-core/acm-observability/files/uwl_metrics_list.yaml +++ b/acm/odh-core/acm-observability/files/uwl_metrics_list.yaml @@ -16,8 +16,8 @@ names: - ovms_request_time_us_bucket - ovms_request_time_us_count - ovms_request_time_us_sum - - ovms_requests_fail - - ovms_requests_success + - ovms_requests_fail_total + - ovms_requests_success_total - ovms_streams - ovms_wait_for_infer_req_time_us_bucket - ovms_wait_for_infer_req_time_us_count diff --git a/acm/odh-core/acm-observability/grafana-dashboards/edge-inference-health.json b/acm/odh-core/acm-observability/grafana-dashboards/edge-inference-health.json index 14225ed8..05ee7fb9 100644 --- a/acm/odh-core/acm-observability/grafana-dashboards/edge-inference-health.json +++ b/acm/odh-core/acm-observability/grafana-dashboards/edge-inference-health.json @@ -242,7 +242,7 @@ "targets": [ { "exemplar": true, - "expr": "sum(ovms_requests_success{cluster=~\"$cluster\"}) by(namespace)", + "expr": "sum(ovms_requests_success_total{cluster=~\"$cluster\"}) by(namespace)", "hide": false, "interval": "", "legendFormat": "{{namespace}} success", @@ -250,7 +250,7 @@ }, { "exemplar": true, - "expr": "sum(ovms_requests_fail{cluster=~\"$cluster\"}) by(namespace)", + "expr": "sum(ovms_requests_fail_total{cluster=~\"$cluster\"}) by(namespace)", "hide": false, "interval": "", "legendFormat": "{{namespace}} fail", diff --git a/acm/odh-edge/base/files/uwl_metrics_list.yaml b/acm/odh-edge/base/files/uwl_metrics_list.yaml index 49bf7d52..1081efb9 100644 --- a/acm/odh-edge/base/files/uwl_metrics_list.yaml +++ b/acm/odh-edge/base/files/uwl_metrics_list.yaml @@ -16,8 +16,8 @@ names: - ovms_request_time_us_bucket - ovms_request_time_us_count - ovms_request_time_us_sum - - ovms_requests_fail - - ovms_requests_success + - ovms_requests_fail_total + - ovms_requests_success_total - ovms_streams - ovms_wait_for_infer_req_time_us_bucket - ovms_wait_for_infer_req_time_us_count