mon: Monitor: adaptive clock skew detection interval

author Joao Eduardo Luis <joao@suse.de>

Thu, 7 Jan 2016 11:05:44 +0000 (11:05 +0000)

committer Xiaoxi Chen <xiaoxchen@ebay.com>

Mon, 14 Mar 2016 00:48:05 +0000 (17:48 -0700)
author Joao Eduardo Luis <joao@suse.de>
Thu, 7 Jan 2016 11:05:44 +0000 (11:05 +0000)
committer Xiaoxi Chen <xiaoxchen@ebay.com>
Mon, 14 Mar 2016 00:48:05 +0000 (17:48 -0700)
diff --git a/src/common/config_opts.h b/src/common/config_opts.h

index 76763e4ee9bde39545684088e4f1ee67a9e6bc38..f774ca9f7796372e781274c772a55e154d79af82 100644 (file)
--- a/src/common/config_opts.h
+++ b/src/common/config_opts.h
@@ -204,6 +204,7 @@ OPTION(mon_clock_drift_allowed, OPT_FLOAT, .050) // allowed clock drift between
  OPTION(mon_clock_drift_warn_backoff, OPT_FLOAT, 5) // exponential backoff for clock drift warnings
  OPTION(mon_timecheck_interval, OPT_FLOAT, 300.0) // on leader, timecheck (clock drift check) interval (seconds)
  OPTION(mon_accept_timeout, OPT_FLOAT, 10.0)    // on leader, if paxos update isn't accepted
+OPTION(mon_timecheck_skew_interval, OPT_FLOAT, 30.0) // on leader, base timecheck (clock drift check) interval while a clock skew is present; multiplied by the number of rounds since the last clean one and capped at mon_timecheck_interval (seconds)
  OPTION(mon_pg_create_interval, OPT_FLOAT, 30.0) // no more than every 30s
  OPTION(mon_pg_stuck_threshold, OPT_INT, 300) // number of seconds after which pgs can be considered inactive, unclean, or stale (see doc/control.rst under dump_stuck for more info)
  OPTION(mon_pg_warn_min_per_osd, OPT_INT, 30)  // min # pgs per (in) osd before we warn the admin
diff --git a/src/mon/Monitor.cc b/src/mon/Monitor.cc

index d62d7cf1e1cc4379f7745431a0d9807e182cd67a..7662f07faa157c30b76580a56d79150e162a9654 100644 (file)
--- a/src/mon/Monitor.cc
+++ b/src/mon/Monitor.cc
@@ -178,6 +178,7 @@ Monitor::Monitor(CephContext* cct_, string nm, MonitorDBStore *s,
  
    timecheck_round(0),
    timecheck_acks(0),
+  timecheck_rounds_since_clean(0),
    timecheck_event(NULL),
  
    probe_timeout_event(NULL),
@@ -3685,8 +3686,7 @@ void Monitor::timecheck_start_round()
    timecheck();
  out:
    dout(10) << __func__ << " setting up next event" << dendl;
-  timecheck_event = new C_TimeCheck(this);
-  timer.add_event_after(g_conf->mon_timecheck_interval, timecheck_event);
+  timecheck_reset_event();
  }
  
  void Monitor::timecheck_finish_round(bool success)
@@ -3700,6 +3700,7 @@ void Monitor::timecheck_finish_round(bool success)
      assert(timecheck_waiting.empty());
      assert(timecheck_acks == quorum.size());
      timecheck_report();
+    timecheck_check_skews();
      return;
    }
  
@@ -3733,6 +3734,65 @@ void Monitor::timecheck_cleanup()
    timecheck_waiting.clear();
    timecheck_skews.clear();
    timecheck_latencies.clear();
+
+  timecheck_rounds_since_clean = 0;
+}
+// (Re)arm the timecheck timer: cancel any pending event, then schedule a fresh C_TimeCheck.
+void Monitor::timecheck_reset_event()
+{
+  if (timecheck_event) {
+    timer.cancel_event(timecheck_event);
+    timecheck_event = NULL;
+  }
+  // The delay grows linearly with the number of rounds counted since the last clean one.
+  double delay =
+    cct->_conf->mon_timecheck_skew_interval * timecheck_rounds_since_clean;
+  // A non-positive delay (e.g. the counter is 0) or one past the regular interval falls back to mon_timecheck_interval.
+  if (delay <= 0 || delay > cct->_conf->mon_timecheck_interval) {
+    delay = cct->_conf->mon_timecheck_interval;
+  }
+
+  dout(10) << __func__ << " delay " << delay
+           << " rounds_since_clean " << timecheck_rounds_since_clean
+           << dendl;
+
+  timecheck_event = new C_TimeCheck(this);
+  timer.add_event_after(delay, timecheck_event);
+}
+// Leader-only: scan the recorded skews and call timecheck_reset_event() if any entry exceeds the allowed drift.
+void Monitor::timecheck_check_skews()
+{
+  dout(10) << __func__ << dendl;
+  assert(is_leader());
+  assert((timecheck_round % 2) == 0);  // NOTE(review): presumably an even round number means no round is in flight -- confirm
+  if (monmap->size() == 1) {
+    assert(0 == "We are alone; we shouldn't have gotten here!");
+    return;
+  }
+  assert(timecheck_latencies.size() == timecheck_skews.size());
+  // Walk every recorded skew; log each offender and remember that at least one was seen.
+  bool found_skew = false;
+  for (map<entity_inst_t, double>::iterator p = timecheck_skews.begin();
+       p != timecheck_skews.end(); ++p) {
+
+    double abs_skew;
+    if (timecheck_has_skew(p->second, &abs_skew)) {
+      dout(10) << __func__
+               << " " << p->first << " skew " << abs_skew << dendl;
+      found_skew = true;
+    }
+  }
+  // Skewed round: bump the counter and re-arm the timer. First clean round after skewed ones: log it and reset the counter.
+  if (found_skew) {
+    ++timecheck_rounds_since_clean;
+    timecheck_reset_event();
+  } else if (timecheck_rounds_since_clean > 0) {
+    dout(1) << __func__
+      << " no clock skews found after " << timecheck_rounds_since_clean
+      << " rounds" << dendl;
+    timecheck_rounds_since_clean = 0;  // the pending timer event is left untouched in this branch
+  }
+
  }
  
  void Monitor::timecheck_report()
@@ -3755,7 +3815,8 @@ void Monitor::timecheck_report()
      m->epoch = get_epoch();
      m->round = timecheck_round;
  
-    for (map<entity_inst_t, double>::iterator it = timecheck_skews.begin(); it != timecheck_skews.end(); ++it) {
+    for (map<entity_inst_t, double>::iterator it = timecheck_skews.begin();
+         it != timecheck_skews.end(); ++it) {
        double skew = it->second;
        double latency = timecheck_latencies[it->first];
  
@@ -3814,10 +3875,10 @@ health_status_t Monitor::timecheck_status(ostringstream &ss,
                                            const double latency)
  {
    health_status_t status = HEALTH_OK;
-  double abs_skew = (skew_bound > 0 ? skew_bound : -skew_bound);
    assert(latency >= 0);
  
-  if (abs_skew > g_conf->mon_clock_drift_allowed) {
+  double abs_skew;
+  if (timecheck_has_skew(skew_bound, &abs_skew)) {
      status = HEALTH_WARN;
      ss << "clock skew " << abs_skew << "s"
         << " > max " << g_conf->mon_clock_drift_allowed << "s";
diff --git a/src/mon/Monitor.h b/src/mon/Monitor.h

index 0d3978a5e78312f7de4d937befba98ce863870f3..89af554dc52a657fa6153b62eff96920571be83b 100644 (file)
--- a/src/mon/Monitor.h
+++ b/src/mon/Monitor.h
@@ -54,6 +54,7 @@
  #include "include/memory.h"
  #include "include/str_map.h"
  #include <errno.h>
+#include <cmath>
  
  
  #define CEPH_MON_PROTOCOL     13 /* cluster internal */
@@ -463,6 +464,15 @@ private:
    version_t timecheck_round;
    unsigned int timecheck_acks;
    utime_t timecheck_round_start;
+  /* When we hit a skew we will start a new round based off of
+   * 'mon_timecheck_skew_interval'. Each new round will be backed off
+   * until we hit 'mon_timecheck_interval' -- which is the typical
+   * interval when not in the presence of a skew.
+   *
+   * This variable tracks the number of rounds with skews since last clean
+   * so that we can report to the user and properly adjust the backoff.
+   */
+  uint64_t timecheck_rounds_since_clean;
    /**
     * Time Check event.
     */
@@ -482,6 +492,8 @@ private:
    void timecheck_finish_round(bool success = true);
    void timecheck_cancel_round();
    void timecheck_cleanup();
+  void timecheck_reset_event();
+  void timecheck_check_skews();
    void timecheck_report();
    void timecheck();
    health_status_t timecheck_status(ostringstream &ss,
@@ -490,6 +502,16 @@ private:
    void handle_timecheck_leader(MTimeCheck *m);
    void handle_timecheck_peon(MTimeCheck *m);
    void handle_timecheck(MTimeCheck *m);
+
+  /**
+   * Returns 'true' if |skew_bound| exceeds 'mon_clock_drift_allowed'; 'false' otherwise.
+   */
+  bool timecheck_has_skew(const double skew_bound, double *abs) const {
+    double abs_skew = std::fabs(skew_bound);
+    if (abs)  // optional out-param: a NULL 'abs' is skipped, otherwise it receives |skew_bound|
+      *abs = abs_skew;
+    return (abs_skew > g_conf->mon_clock_drift_allowed);
+  }
    /**
     * @}
     */
author	Joao Eduardo Luis <joao@suse.de>
	Thu, 7 Jan 2016 11:05:44 +0000 (11:05 +0000)
committer	Xiaoxi Chen <xiaoxchen@ebay.com>
	Mon, 14 Mar 2016 00:48:05 +0000 (17:48 -0700)
src/common/config_opts.h		patch \| blob \| history
src/mon/Monitor.cc		patch \| blob \| history
src/mon/Monitor.h		patch \| blob \| history