openshift · openshift-merge-robot · Oct 20, 2021 · Oct 20, 2021
diff --git a/files/prometheus_alerts.yml b/files/prometheus_alerts.yml
@@ -11,6 +11,7 @@
       sum by (cluster) (es_cluster_status == 2)
     "for": 7m
     "labels":
+      "namespace": openshift-logging
       "severity": critical
 
   - "alert": ElasticsearchClusterNotHealthy
@@ -22,6 +23,7 @@
       sum by (cluster) (es_cluster_status == 1)
     "for": 20m
     "labels":
+      "namespace": openshift-logging
       "severity": warning
 
   - "alert": ElasticsearchWriteRequestsRejectionJumps
@@ -33,6 +35,7 @@
       round( writing:reject_ratio:rate2m * 100, 0.001 ) > 5
     "for": 10m
     "labels":
+      "namespace": openshift-logging
       "severity": warning
 
   - "alert": ElasticsearchNodeDiskWatermarkReached
@@ -51,6 +54,7 @@
       ) > on(instance, pod) es_cluster_routing_allocation_disk_watermark_low_pct
     "for": 5m
     "labels":
+      "namespace": openshift-logging
       "severity": info
 
   - "alert": ElasticsearchNodeDiskWatermarkReached
@@ -69,6 +73,7 @@
       ) > on(instance, pod) es_cluster_routing_allocation_disk_watermark_high_pct
     "for": 5m
     "labels":
+      "namespace": openshift-logging
       "severity": critical
 
   - "alert": ElasticsearchNodeDiskWatermarkReached
@@ -87,6 +92,7 @@
       ) > on(instance, pod) es_cluster_routing_allocation_disk_watermark_flood_stage_pct
     "for": 5m
     "labels":
+      "namespace": openshift-logging
       "severity": critical
 
   - "alert": ElasticsearchJVMHeapUseHigh
@@ -98,6 +104,7 @@
       sum by (cluster, instance, node) (es_jvm_mem_heap_used_percent) > 75
     "for": 10m
     "labels":
+      "namespace": openshift-logging
       "severity": info
 
   - "alert": AggregatedLoggingSystemCPUHigh
@@ -109,6 +116,7 @@
       sum by (cluster, instance, node) (es_os_cpu_percent) > 90
     "for": 1m
     "labels":
+      "namespace": openshift-logging
       "severity": info
 
   - "alert": ElasticsearchProcessCPUHigh
@@ -120,6 +128,7 @@
       sum by (cluster, instance, node) (es_process_cpu_percent) > 90
     "for": 1m
     "labels":
+      "namespace": openshift-logging
       "severity": info
 
   - "alert": ElasticsearchDiskSpaceRunningLow
@@ -131,6 +140,7 @@
       sum(predict_linear(es_fs_path_available_bytes[6h], 6 * 3600)) < 0
     "for": 1h
     "labels":
+      "namespace": openshift-logging
       "severity": critical
 
   - "alert": ElasticsearchHighFileDescriptorUsage
@@ -142,6 +152,7 @@
       predict_linear(es_process_file_descriptors_max_number[1h], 3600) - predict_linear(es_process_file_descriptors_open_number[1h], 3600) < 0
     "for": 10m
     "labels":
+      "namespace": openshift-logging
       "severity": warning
 
   - "alert": ElasticsearchOperatorCSVNotSuccessful
@@ -152,6 +163,7 @@
       csv_succeeded{name =~ "elasticsearch-operator.*"} == 0
     "for": 10m
     "labels":
+      "namespace": openshift-logging
       "severity": warning
 
   - "alert": ElasticsearchNodeDiskWatermarkReached
@@ -170,6 +182,7 @@
       ) > on(instance, pod) es_cluster_routing_allocation_disk_watermark_low_pct
     "for": 1h
     "labels":
+      "namespace": openshift-logging
       "severity": warning
 
   - "alert": ElasticsearchNodeDiskWatermarkReached
@@ -188,6 +201,7 @@
       ) > on(instance, pod) es_cluster_routing_allocation_disk_watermark_high_pct
     "for": 1h
     "labels":
+      "namespace": openshift-logging
       "severity": warning
 
   - "alert": ElasticsearchNodeDiskWatermarkReached
@@ -206,4 +220,5 @@
       ) > on(instance, pod) es_cluster_routing_allocation_disk_watermark_flood_stage_pct
     "for": 1h
     "labels":
+      "namespace": openshift-logging
       "severity": warning
diff --git a/test/files/prometheus-unit-tests/test.yml b/test/files/prometheus-unit-tests/test.yml
@@ -67,6 +67,7 @@ tests:
         exp_alerts:
           - exp_labels:
               cluster: elasticsearch
+              namespace: openshift-logging
               severity: warning
             exp_annotations:
               summary: "Cluster health status is YELLOW"
@@ -79,6 +80,7 @@ tests:
         exp_alerts:
           - exp_labels:
               cluster: elasticsearch
+              namespace: openshift-logging
               severity: critical
             exp_annotations:
               summary: "Cluster health status is RED"
@@ -98,6 +100,7 @@ tests:
               cluster: elasticsearch
               instance: localhost:9090
               node: elasticsearch-cdm-1
+              namespace: openshift-logging
               severity: warning
             exp_annotations:
               summary: "High Write Rejection Ratio - 10%"
@@ -117,6 +120,7 @@ tests:
           - exp_labels:
               instance: localhost:9090
               pod: pod-1
+              namespace: openshift-logging
               severity: info
             exp_annotations:
               summary: "Disk Low Watermark Reached - disk saturation is 90%"
@@ -130,6 +134,7 @@ tests:
           - exp_labels:
               instance: localhost:9091
               pod: pod-2
+              namespace: openshift-logging
               severity: warning
             exp_annotations:
               summary: "Disk Low Watermark is predicted to be reached within next 6h."
@@ -144,6 +149,7 @@ tests:
               cluster: elasticsearch
               instance: localhost:9090
               node: elasticsearch-cdm-1
+              namespace: openshift-logging
               severity: info
             exp_annotations:
               summary: "System CPU usage is high"
@@ -163,6 +169,7 @@ tests:
               cluster: elasticsearch
               instance: localhost:9090
               node: elasticsearch-cdm-1
+              namespace: openshift-logging
               severity: info
             exp_annotations:
               summary: "ES process CPU usage is high"
@@ -180,6 +187,7 @@ tests:
         exp_alerts:
           - exp_labels:
               name: elasticsearch-operator.currentversion-builddate
+              namespace: openshift-logging
               severity: warning
             exp_annotations:
               summary: "Elasticsearch Operator CSV Not Successful"