File tree Expand file tree Collapse file tree 2 files changed +0
-53
lines changed
rhobs/alerting/data_plane
test/promql/tests/data_plane Expand file tree Collapse file tree 2 files changed +0
-53
lines changed Original file line number Diff line number Diff line change 7171 alert_routing_key : infra
7272 team : konflux-infra
7373 runbook_url : https://gitlab.cee.redhat.com/konflux/docs/sop/-/blob/main/o11y/alert-rules/alert-rule-MultiPlatformControllerPlatformUnhealthy.md
74-
75- - name : multi-platform-controller-metrics-health
76- interval : 30s
77- rules :
78- - alert : MultiPlatformControllerMetricsUnhealthy
79- expr : |
80- count by (source_cluster) (multi_platform_controller_running_tasks < 0 or multi_platform_controller_waiting_tasks < 0) > 0
81- for : 1m
82- labels :
83- severity : warning
84- annotations :
85- summary : >-
86- Multi-platform controller metrics are unhealthy in cluster {{ $labels.source_cluster }}
87- description : >-
88- The multi-platform controller Gauge metrics are showing negative values for the last 1 minute in cluster {{ $labels.source_cluster }}
89- alert_routing_key : infra
90- team : konflux-infra
Original file line number Diff line number Diff line change @@ -103,39 +103,3 @@ tests:
103103 alert_routing_key : infra
104104 team : konflux-infra
105105 runbook_url : https://gitlab.cee.redhat.com/konflux/docs/sop/-/blob/main/o11y/alert-rules/alert-rule-MultiPlatformControllerPlatformUnhealthy.md
106-
107- - interval : 30s
108- input_series :
109- - series : ' multi_platform_controller_running_tasks{source_cluster="c7"}'
110- values : ' -1 -1 -1 -1'
111- - series : ' multi_platform_controller_waiting_tasks{source_cluster="c7"}'
112- values : ' 5 5 5 5'
113- - series : ' multi_platform_controller_running_tasks{source_cluster="c8"}'
114- values : ' 3 3 3 3'
115- - series : ' multi_platform_controller_waiting_tasks{source_cluster="c8"}'
116- values : ' 1 -1 -1 -1'
117- - series : ' multi_platform_controller_running_tasks{source_cluster="c9"}'
118- values : ' 1 -1 1 -1'
119- - series : ' multi_platform_controller_waiting_tasks{source_cluster="c9"}'
120- values : ' 1 -1 0 1'
121-
122- alert_rule_test :
123- - eval_time : 2m
124- alertname : MultiPlatformControllerMetricsUnhealthy
125- exp_alerts :
126- - exp_labels :
127- severity : warning
128- source_cluster : c7
129- exp_annotations :
130- summary : Multi-platform controller metrics are unhealthy in cluster c7
131- description : The multi-platform controller Gauge metrics are showing negative values for the last 1 minute in cluster c7
132- alert_routing_key : infra
133- team : konflux-infra
134- - exp_labels :
135- severity : warning
136- source_cluster : c8
137- exp_annotations :
138- summary : Multi-platform controller metrics are unhealthy in cluster c8
139- description : The multi-platform controller Gauge metrics are showing negative values for the last 1 minute in cluster c8
140- alert_routing_key : infra
141- team : konflux-infra
You can’t perform that action at this time.
0 commit comments