From 03484c5b22948ed970d5cabf24a2aedd72afcc64 Mon Sep 17 00:00:00 2001
From: Arun Kumar Mohan
Date: Fri, 1 Oct 2021 15:50:44 +0530
Subject: [PATCH] Adding namespace field into other alert queries

Signed-off-by: Arun Kumar Mohan
---
Review notes (this section sits after the "---" marker and is not part of
the commit message):

* CephOSDVersionMismatch: the outer aggregation groups by (namespace) only.
  The inner count yields one series per (ceph_version, namespace) pair; if
  the outer count were grouped by those same two labels, every group would
  hold exactly one series and "> 1" could never be true, i.e. the alert
  would never fire. Grouping the outer count by namespace counts the
  distinct OSD versions inside each namespace.
* NOTE(review): line breaks and context-line indentation were reconstructed
  from a whitespace-collapsed copy of this patch -- confirm against the tree
  or apply with --ignore-whitespace. The post-image blob ids on the "index"
  lines for state.libsonnet and prometheus-ceph-rules.yaml were not
  recomputed after the fix above.

 alerts/absent_alerts.libsonnet              | 4 ++--
 alerts/monquorum.libsonnet                  | 2 +-
 alerts/state.libsonnet                      | 2 +-
 extras/manifests/prometheus-ceph-rules.yaml | 8 ++++----
 4 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/alerts/absent_alerts.libsonnet b/alerts/absent_alerts.libsonnet
index b032117..b2da4ab 100644
--- a/alerts/absent_alerts.libsonnet
+++ b/alerts/absent_alerts.libsonnet
@@ -23,7 +23,7 @@
           {
             alert: 'CephMgrIsMissingReplicas',
             expr: |||
-              sum(up{%(cephExporterSelector)s}) < %(cephMgrCount)d
+              sum(up{%(cephExporterSelector)s}) by (namespace) < %(cephMgrCount)d
             ||| % $._config,
             'for': $._config.mgrMissingReplicasAlertTime,
             labels: {
@@ -44,7 +44,7 @@
           {
             alert: 'CephMdsMissingReplicas',
             expr: |||
-              sum(ceph_mds_metadata{%(cephExporterSelector)s} == 1) < %(cephMdsCount)d
+              sum(ceph_mds_metadata{%(cephExporterSelector)s} == 1) by (namespace) < %(cephMdsCount)d
             ||| % $._config,
             'for': $._config.mdsMissingReplicasAlertTime,
             labels: {
diff --git a/alerts/monquorum.libsonnet b/alerts/monquorum.libsonnet
index b86a8e9..33a6da3 100644
--- a/alerts/monquorum.libsonnet
+++ b/alerts/monquorum.libsonnet
@@ -7,7 +7,7 @@
           {
             alert: 'CephMonQuorumAtRisk',
             expr: |||
-              count(ceph_mon_quorum_status{%s} == 1) <= (floor(count(ceph_mon_metadata{%s}) / 2) + 1)
+              count(ceph_mon_quorum_status{%s} == 1) by (namespace) <= (floor(count(ceph_mon_metadata{%s}) by (namespace) / 2) + 1)
             ||| % [$._config.cephExporterSelector, $._config.cephExporterSelector],
             'for': $._config.monQuorumAlertTime,
             labels: {
diff --git a/alerts/state.libsonnet b/alerts/state.libsonnet
index 1468da7..5300187 100644
--- a/alerts/state.libsonnet
+++ b/alerts/state.libsonnet
@@ -39,7 +39,7 @@
           {
             alert: 'CephOSDVersionMismatch',
             expr: |||
-              count(count(ceph_osd_metadata{%(cephExporterSelector)s}) by (ceph_version)) > 1
+              count(count(ceph_osd_metadata{%(cephExporterSelector)s}) by (ceph_version, namespace)) by (namespace) > 1
             ||| % $._config,
             'for': $._config.clusterVersionAlertTime,
             labels: {
diff --git a/extras/manifests/prometheus-ceph-rules.yaml b/extras/manifests/prometheus-ceph-rules.yaml
index cc46355..cc4b370 100644
--- a/extras/manifests/prometheus-ceph-rules.yaml
+++ b/extras/manifests/prometheus-ceph-rules.yaml
@@ -53,7 +53,7 @@ spec:
         severity_level: warning
         storage_type: ceph
       expr: |
-        sum(up{job="rook-ceph-mgr"}) < 1
+        sum(up{job="rook-ceph-mgr"}) by (namespace) < 1
       for: 5m
       labels:
         severity: warning
@@ -66,7 +66,7 @@ spec:
         severity_level: warning
         storage_type: ceph
       expr: |
-        sum(ceph_mds_metadata{job="rook-ceph-mgr"} == 1) < 2
+        sum(ceph_mds_metadata{job="rook-ceph-mgr"} == 1) by (namespace) < 2
       for: 5m
       labels:
         severity: warning
@@ -79,7 +79,7 @@ spec:
         severity_level: error
         storage_type: ceph
       expr: |
-        count(ceph_mon_quorum_status{job="rook-ceph-mgr"} == 1) <= (floor(count(ceph_mon_metadata{job="rook-ceph-mgr"}) / 2) + 1)
+        count(ceph_mon_quorum_status{job="rook-ceph-mgr"} == 1) by (namespace) <= (floor(count(ceph_mon_metadata{job="rook-ceph-mgr"}) by (namespace) / 2) + 1)
       for: 15m
       labels:
         severity: critical
@@ -252,7 +252,7 @@ spec:
         severity_level: warning
         storage_type: ceph
       expr: |
-        count(count(ceph_osd_metadata{job="rook-ceph-mgr"}) by (ceph_version)) > 1
+        count(count(ceph_osd_metadata{job="rook-ceph-mgr"}) by (ceph_version, namespace)) by (namespace) > 1
       for: 10m
       labels:
         severity: warning