mon: allow a MON_DOWN grace period after cluster mkfs

author Sage Weil <sage@newdream.net>

Thu, 15 Jul 2021 20:17:23 +0000 (15:17 -0500)

committer Laura Flores <lflores@redhat.com>

Wed, 19 Oct 2022 21:20:15 +0000 (21:20 +0000)
author Sage Weil <sage@newdream.net>
Thu, 15 Jul 2021 20:17:23 +0000 (15:17 -0500)
committer Laura Flores <lflores@redhat.com>
Wed, 19 Oct 2022 21:20:15 +0000 (21:20 +0000)
diff --git a/src/common/options.cc b/src/common/options.cc

index 89731a5bbd7791693fb4be74ab02ae3b95dd12f8..b0239e24aa4d3ebe94f2f9700e09edbfd3ec1a01 100644 (file)
--- a/src/common/options.cc
+++ b/src/common/options.cc
@@ -5634,6 +5634,11 @@ std::vector<Option> get_global_options() {
      .set_description("Period in seconds between monitor-to-manager "
                       "health/status updates"),
  
+    Option("mon_down_mkfs_grace", Option::TYPE_SECS, Option::LEVEL_ADVANCED)
+    .set_default(60)
+    .add_service("mon")
+    .set_description("Period in seconds that the cluster may have a mon down after cluster creation"),
+
      Option("mon_mgr_beacon_grace", Option::TYPE_SECS, Option::LEVEL_ADVANCED)
      .set_default(30)
      .add_service("mon")
diff --git a/src/mon/HealthMonitor.cc b/src/mon/HealthMonitor.cc

index ae92e8b77521bf8806f1a4d676baf343335536ad..a45159e7c669c4e4d4620dbe4fe124430769b4a8 100644 (file)
--- a/src/mon/HealthMonitor.cc
+++ b/src/mon/HealthMonitor.cc
@@ -798,7 +798,9 @@ void HealthMonitor::check_for_mon_down(health_check_map_t *checks)
  {
    int max = mon.monmap->size();
    int actual = mon.get_quorum().size();
-  if (actual < max) {
+  const auto now = ceph::real_clock::now();
+  if (actual < max &&
+      now > mon.monmap->created.to_real_time() + g_conf().get_val<std::chrono::seconds>("mon_down_mkfs_grace")) {
      ostringstream ss;
      ss << (max-actual) << "/" << max << " mons down, quorum "
         << mon.get_quorum_names();
author	Sage Weil <sage@newdream.net>
	Thu, 15 Jul 2021 20:17:23 +0000 (15:17 -0500)
committer	Laura Flores <lflores@redhat.com>
	Wed, 19 Oct 2022 21:20:15 +0000 (21:20 +0000)
src/common/options.cc		patch | blob | history
src/mon/HealthMonitor.cc		patch | blob | history