Skip to content

Commit

Permalink
Add prometheus alerts for Tide pool errors.
Browse files Browse the repository at this point in the history
  • Loading branch information
cjwagner committed Oct 18, 2019
1 parent 99c2185 commit 70005b2
Showing 1 changed file with 26 additions and 0 deletions.
26 changes: 26 additions & 0 deletions prow/cluster/monitoring/mixins/prometheus/tide_alerts.libsonnet
Expand Up @@ -48,6 +48,32 @@
message: 'The Tide status update controllers loop period has averaged more than 2 minutes for the last 15 mins.',
},
},
// Warning-level rule: fires when at least one (org, repo, branch) group has
// accumulated 3 or more `tidepoolerrors` over the trailing 10 minutes.
{
alert: 'TidePoolErrorRateIndividual',
// Inner sum(...) by (org, repo, branch): error increase per group over 10m.
// Outer max(...): keeps only the largest of those per-group totals; since it has
// no `by` clause, the result no longer carries org/repo/branch labels.
// `or vector(0)`: substitutes a 0 sample when the left side returns no series.
// A 0 never satisfies `>= 3`, so this does not change when the alert fires
// (presumably kept so the inner expression always yields a value — confirm).
expr: |||
(max(sum(increase(tidepoolerrors[10m])) by (org, repo, branch)) or vector(0)) >= 3
|||,
// The expression must hold continuously for 5 minutes before the alert fires.
'for': '5m',
labels: {
severity: 'warning',
},
annotations: {
// `<deck-url>` is written literally in the message text; nothing in this rule substitutes it.
message: 'At least one Tide pool encountered 3+ sync errors in a 10 minute window. If the TidePoolErrorRateMultiple alert has not fired this is likely an isolated configuration issue. See the <deck-url>/tide-history page.',
},
},
// Critical-level rule: fires when 3 or more distinct (org, repo) groups have each
// accumulated 3 or more `tidepoolerrors` over the trailing 10 minutes.
{
alert: 'TidePoolErrorRateMultiple',
// Inner sum(...) by (org, repo): error increase per repo over 10m (branches are summed together).
// `>= 3` inside count(): keeps only the repos whose total is at least 3.
// count(...): number of such repos; it returns no series when none qualify,
// in which case `or vector(0)` supplies a 0 sample instead.
// Final `>= 3`: requires at least three qualifying repos. A 0 never satisfies it,
// so the `or vector(0)` fallback does not change when the alert fires.
expr: |||
(count(sum(increase(tidepoolerrors[10m])) by (org, repo) >= 3) or vector(0)) >= 3
|||,
// The expression must hold continuously for 5 minutes before the alert fires.
'for': '5m',
labels: {
severity: 'critical',
},
annotations: {
// `<deck-url>` is written literally in the message text; nothing in this rule substitutes it.
message: 'Tide encountered 3+ sync errors in a 10 minute window in at least 3 different repos that it handles. See the <deck-url>/tide-history page.',
},
},
],
},
],
Expand Down

0 comments on commit 70005b2

Please sign in to comment.