rules:
# Critical alert: fires when the filesystem mounted at "/" has less than
# 5 percent of its size available. The added "for: 5m" means the condition
# has to hold for five minutes before the alert fires.
- alert: root volume full
expr: node_filesystem_avail_bytes{mountpoint="/"} / node_filesystem_size_bytes{mountpoint="/"} * 100 < 5
+ for: 5m
labels:
severity: critical
type: ceph_default
Node {{ $labels.instance }} experiences packet errors > 1
packet/s on interface {{ $labels.device }}.
# Warning alert on filesystems that are running out of free space.
# Removed form: free bytes divided by deriv() of free bytes over 2 days,
# alerting when the result was in the range (0, 5].
# Added form: predict_linear() extrapolates free bytes from the last 2 days
# over 3600 * 24 * 5 seconds (5 days) and alerts when the forecast is below 0.
# The join on "instance" copies the nodename label from node_uname_info onto
# the result; it only preserves the sign of the forecast if node_uname_info
# has a positive value (presumably a constant 1 -- TODO confirm).
- # predict fs fill-up times
- - alert: storage filling
+ - alert: storage filling up
expr: |
- (
- (
- node_filesystem_free_bytes / deriv(node_filesystem_free_bytes[2d])
- * on(instance) group_left(nodename) node_uname_info
- ) <= 5
- ) > 0
+ predict_linear(node_filesystem_free_bytes[2d], 3600 * 24 * 5) *
+ on(instance) group_left(nodename) node_uname_info < 0
labels:
severity: warning
type: ceph_default
# Warning alert: a pool is projected to run out of space within 5 days.
# ceph_pool_stored is extrapolated linearly from the last 2 days over
# 3600 * 24 * 5 seconds and compared with the pool's capacity.
# ceph_pool_max_avail is presumably the space still free, not the total
# size (TODO confirm against the exporter), so capacity is taken as
# ceph_pool_stored + ceph_pool_max_avail; comparing against max_avail alone
# would fire as soon as used space exceeded free space.
# The join uses a bare group_right: the result keeps the labels of
# ceph_pool_metadata (the "many" side). group_right(name) would instead take
# "name" from the left-hand side, which presumably does not carry it, and
# Prometheus then removes the label from the result.
- alert: pool filling up
expr: |
(
- (
- (ceph_pool_max_avail - ceph_pool_stored) / deriv(ceph_pool_max_avail[2d])
- ) * on(pool_id) group_right ceph_pool_metadata <= 5
- ) > 0
+ predict_linear(ceph_pool_stored[2d], 3600 * 24 * 5) >=
+ ceph_pool_stored + ceph_pool_max_avail
+ ) * on(pool_id) group_right ceph_pool_metadata
labels:
severity: warning
type: ceph_default