You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@camel.apache.org by as...@apache.org on 2020/11/10 10:20:17 UTC
[camel-k] 17/25: feat: Add default alerting rule for build error SLO
This is an automated email from the ASF dual-hosted git repository.
astefanutti pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/camel-k.git
commit 45ba6a097d8b204f60764091745412ec8c777010
Author: Antonin Stefanutti <an...@stefanutti.fr>
AuthorDate: Wed Oct 21 18:39:23 2020 +0200
feat: Add default alerting rule for build error SLO
---
deploy/operator-prometheus-rule.yaml | 15 ++++++++++++++-
1 file changed, 14 insertions(+), 1 deletion(-)
diff --git a/deploy/operator-prometheus-rule.yaml b/deploy/operator-prometheus-rule.yaml
index ab4e837..83f056a 100644
--- a/deploy/operator-prometheus-rule.yaml
+++ b/deploy/operator-prometheus-rule.yaml
@@ -70,7 +70,7 @@ spec:
for {{ $labels.job }} have their duration above 5m.
- alert: CamelKBuildFailure
expr: |
- sum(rate(camel_k_build_duration_seconds_count{result="Error"}[5m])) by (job)
+ sum(rate(camel_k_build_duration_seconds_count{result="Failed"}[5m])) by (job)
/
sum(rate(camel_k_build_duration_seconds_count[5m])) by (job)
* 100
@@ -81,6 +81,19 @@ spec:
annotations:
message: |
{{ printf "%0.0f" $value }}% of the builds for {{ $labels.job }} have failed.
+ - alert: CamelKBuildError
+ expr: |
+ sum(rate(camel_k_build_duration_seconds_count{result="Error"}[5m])) by (job)
+ /
+ sum(rate(camel_k_build_duration_seconds_count[5m])) by (job)
+ * 100
+ > 1
+ for: 10m
+ labels:
+ severity: critical
+ annotations:
+ message: |
+ {{ printf "%0.0f" $value }}% of the builds for {{ $labels.job }} have errored.
- alert: CamelKBuildQueueDuration1m
expr: |
(