From 1c0d33c53a0aba3a943b23009b9f97a16f13a9ad Mon Sep 17 00:00:00 2001
From: Gero Posmyk-Leinemann
Date: Thu, 21 Sep 2023 12:40:36 +0000
Subject: [PATCH] [alerts] Exclude reason "imageBuildFailedUser" from InstanceStartFailures

---
Notes (ignored by `git am`; not part of the commit message):

* Prometheus regex label matchers are fully anchored, so the previous
  matcher reason!~"imageBuildFailed" did not exclude the distinct value
  "imageBuildFailedUser"; it has to be listed as its own alternative.
* NOTE(review): this patch was recovered from a copy flattened onto one
  line. The leading whitespace of the hunk lines and the blank first
  context line are reconstructed -- verify against server.yaml before
  applying.

 operations/observability/mixins/meta/rules/server.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/operations/observability/mixins/meta/rules/server.yaml b/operations/observability/mixins/meta/rules/server.yaml
index a21ca6dad301c6..429fd0b959c703 100644
--- a/operations/observability/mixins/meta/rules/server.yaml
+++ b/operations/observability/mixins/meta/rules/server.yaml
@@ -35,7 +35,7 @@ spec:

     - alert: InstanceStartFailures
       # Reasoning: 1 failure every 120s should not trigger an incident: 1/120 = 0.00833.. => 0.01
-      expr: sum(irate(gitpod_server_instance_starts_failed_total{reason!~"imageBuildFailed"}[2m])) by (reason) > 0.01
+      expr: sum(irate(gitpod_server_instance_starts_failed_total{reason!~"imageBuildFailed|imageBuildFailedUser"}[2m])) by (reason) > 0.01
       for: 30s
       labels:
         severity: critical