From e205901dd912c673404231005ae9f2f998d4e560 Mon Sep 17 00:00:00 2001 From: Bastian Eicher Date: Wed, 3 Jan 2024 20:50:48 +0100 Subject: [PATCH] Improved log alerting to sum message count over pods --- charts/generic-service/templates/alerts-logs.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/charts/generic-service/templates/alerts-logs.yaml b/charts/generic-service/templates/alerts-logs.yaml index a9bb6ef..18228b2 100644 --- a/charts/generic-service/templates/alerts-logs.yaml +++ b/charts/generic-service/templates/alerts-logs.yaml @@ -11,7 +11,7 @@ spec: rules: {{- range $level, $options := .Values.alerting.logs.levels }} - alert: LogMessages{{ $level | title }} - expr: count_over_time(({namespace="{{ $.Release.Namespace }}", container="{{ include "generic-service.fullname" $ }}", {{ $.Values.alerting.logs.levelLabel }}="{{ $level }}"})[{{ $.Values.alerting.logs.countInterval }}]) > {{ $options.maxCount | default 0 }} + expr: sum(count_over_time(({namespace="{{ $.Release.Namespace }}", container="{{ include "generic-service.fullname" $ }}", {{ $.Values.alerting.logs.levelLabel }}="{{ $level }}"})[{{ $.Values.alerting.logs.countInterval }}])) > {{ $options.maxCount | default 0 }} for: 1s labels: {{- include "generic-service.alert-labels" $ | nindent 12 }} {{ $options.severity | default "warning" }} topic: logs