git.apps.os.sepia.ceph.com Git - ceph.git/commitdiff
monitoring: alert for prediction of disk and pool fill up broken 34395/head
author Patrick Seidensal <pseidensal@suse.com>
Thu, 26 Mar 2020 21:49:57 +0000 (22:49 +0100)
committer Volker Theile <vtheile@suse.com>
Fri, 3 Apr 2020 10:25:53 +0000 (12:25 +0200)
Fixes: https://tracker.ceph.com/issues/44776
Signed-off-by: Patrick Seidensal <pseidensal@suse.com>
(cherry picked from commit 6935dc55921ef533e939719bad7dc12324450bbb)

Conflicts:
  monitoring/prometheus/alerts/ceph_default_alerts.yml

monitoring/prometheus/alerts/ceph_default_alerts.yml

index a9b0560d4730b8ff9736d110c9377f39e25f44ec..7bb3b9352fcfe7d5e72d5f0cde8dfcb21910a25d 100644 (file)
@@ -199,15 +199,10 @@ groups:
             Node {{ $labels.instance }} experiences packet errors > 1
             packet/s on interface {{ $labels.device }}.
 
-      # predict fs fill-up times
-      - alert: storage filling
+      - alert: storage filling up
         expr: |
-          (
-            (
-              node_filesystem_free_bytes / deriv(node_filesystem_free_bytes[2d])
-              * on(instance) group_left(nodename) node_uname_info
-            ) <= 5
-          ) > 0
+          predict_linear(node_filesystem_free_bytes[2d], 3600 * 24 * 5) *
+          on(instance) group_left(nodename) node_uname_info < 0
         labels:
           severity: warning
           type: ceph_default
@@ -234,10 +229,9 @@ groups:
       - alert: pool filling up
         expr: |
           (
-            (
-              (ceph_pool_max_avail - ceph_pool_stored) / deriv(ceph_pool_max_avail[2d])
-            ) * on(pool_id) group_right ceph_pool_metadata <= 5
-          ) > 0
+            predict_linear(ceph_pool_stored[2d], 3600 * 24 * 5) >=
+            ceph_pool_max_avail
+          ) * on(pool_id) group_right(name) ceph_pool_metadata
         labels:
           severity: warning
           type: ceph_default