X-Git-Url: https://gerrit.fd.io/r/gitweb?a=blobdiff_plain;f=terraform-ci-infra%2F1n_nmd%2Fprometheus%2Fconf%2Fnomad%2Fprometheus.hcl;fp=terraform-ci-infra%2F1n_nmd%2Fprometheus%2Fconf%2Fnomad%2Fprometheus.hcl;h=235a04228cd60cb03159daad5a9009c29d0e7356;hb=5551ffb9e6fb4f6de54331d9105bc1e4bbd0641e;hp=d851628fcdc31663bb866db3e59070fe62981cec;hpb=85785b4fac91e2bc443d4b62b80df418d8a99699;p=csit.git diff --git a/terraform-ci-infra/1n_nmd/prometheus/conf/nomad/prometheus.hcl b/terraform-ci-infra/1n_nmd/prometheus/conf/nomad/prometheus.hcl index d851628fcd..235a04228c 100644 --- a/terraform-ci-infra/1n_nmd/prometheus/conf/nomad/prometheus.hcl +++ b/terraform-ci-infra/1n_nmd/prometheus/conf/nomad/prometheus.hcl @@ -191,7 +191,7 @@ groups: - name: "Jenkins Job Health Exporter" rules: - alert: JenkinsJobHealthExporterFailures - expr: jenkins_job_failure{id=~".*"} >= 10 + expr: jenkins_job_failure{id=~".*"} > jenkins_job_success{id=~".*"} for: 0m labels: severity: critical @@ -199,7 +199,7 @@ groups: summary: "Jenkins Job Health detected high failure rate on jenkins jobs." description: "Job: {{ $labels.id }}" - alert: JenkinsJobHealthExporterUnstable - expr: jenkins_job_unstable{id=~".*"} >= 10 + expr: jenkins_job_unstable{id=~".*"} > jenkins_job_success{id=~".*"} for: 0m labels: severity: warning