Skip to content

Commit

Permalink
Merge pull request #94 from aruniiird/all-alert-interval-changes
Browse files (browse the repository at this point in the history)
All alert interval changes
  • Loading branch information
umangachapagain committed Feb 2, 2022
2 parents 2464af2 + 922df79 commit c77ec28
Show file tree
Hide file tree
Showing 4 changed files with 8 additions and 5 deletions.
4 changes: 2 additions & 2 deletions alerts/osd.libsonnet
Expand Up @@ -57,7 +57,7 @@
expr: |||
label_replace((ceph_osd_in == 1 and ceph_osd_up == 0),"disk","$1","ceph_daemon","osd.(.*)") + on(ceph_daemon) group_left(host, device) label_replace(ceph_disk_occupation,"host","$1","exported_instance","(.*)")
||| % $._config,
- 'for': $._config.osdDiskAlertTime,
+ 'for': $._config.osdDiskNotRespondingTime,
labels: {
severity: 'critical',
},
Expand All @@ -73,7 +73,7 @@
expr: |||
label_replace((ceph_osd_in == 0 and ceph_osd_up == 0),"disk","$1","ceph_daemon","osd.(.*)") + on(ceph_daemon) group_left(host, device) label_replace(ceph_disk_occupation,"host","$1","exported_instance","(.*)")
||| % $._config,
- 'for': $._config.osdDiskAlertTime,
+ 'for': $._config.osdDiskUnavailableTime,
labels: {
severity: 'critical',
},
Expand Down
2 changes: 1 addition & 1 deletion alerts/state.libsonnet
Expand Up @@ -25,7 +25,7 @@
expr: |||
ceph_health_status{%(cephExporterSelector)s} == 1
||| % $._config,
- 'for': $._config.clusterStateAlertTime,
+ 'for': $._config.clusterWarningStateAlertTime,
labels: {
severity: 'warning',
},
Expand Down
3 changes: 3 additions & 0 deletions config.libsonnet
Expand Up @@ -11,6 +11,7 @@
// Duration to raise various Alerts
cephNodeDownAlertTime: '30s',
clusterStateAlertTime: '10m',
+ clusterWarningStateAlertTime: '15m',
clusterVersionAlertTime: '10m',
clusterUtilizationAlertTime: '5s',
clusterReadOnlyAlertTime: '0s',
Expand All @@ -20,6 +21,8 @@
osdDataRebalanceAlertTime: '15s',
osdDataRecoveryAlertTime: '2h',
osdDataRecoveryInProgressAlertTime: '30s',
+ osdDiskNotRespondingTime: '15m',
+ osdDiskUnavailableTime: '1m',
osdDiskAlertTime: '1m',
osdDownAlertTime: '5m',
osdFlapAlertTime: '0s',
Expand Down
4 changes: 2 additions & 2 deletions extras/manifests/prometheus-ceph-rules.yaml
Expand Up @@ -150,7 +150,7 @@ spec:
storage_type: ceph
expr: |
label_replace((ceph_osd_in == 1 and ceph_osd_up == 0),"disk","$1","ceph_daemon","osd.(.*)") + on(ceph_daemon) group_left(host, device) label_replace(ceph_disk_occupation,"host","$1","exported_instance","(.*)")
- for: 1m
+ for: 15m
labels:
severity: critical
- alert: CephOSDDiskUnavailable
Expand Down Expand Up @@ -242,7 +242,7 @@ spec:
storage_type: ceph
expr: |
ceph_health_status{job="rook-ceph-mgr"} == 1
- for: 10m
+ for: 15m
labels:
severity: warning
- alert: CephOSDVersionMismatch
Expand Down

0 comments on commit c77ec28

Please sign in to comment.