mon: add 'mds cluster_reset' command

author Sage Weil <sage@newdream.net>

Thu, 27 Jan 2011 16:15:23 +0000 (08:15 -0800)

committer Sage Weil <sage@newdream.net>

Thu, 27 Jan 2011 16:34:29 +0000 (08:34 -0800)
author Sage Weil <sage@newdream.net>
Thu, 27 Jan 2011 16:15:23 +0000 (08:15 -0800)
committer Sage Weil <sage@newdream.net>
Thu, 27 Jan 2011 16:34:29 +0000 (08:34 -0800)
diff --git a/src/mon/MDSMonitor.cc b/src/mon/MDSMonitor.cc

index a9d181249e65923bc7bfc128ca644b749430a0bb..340edce178dfedabbc2d4dc281ecaa059c81e7b8 100644 (file)
--- a/src/mon/MDSMonitor.cc
+++ b/src/mon/MDSMonitor.cc
@@ -625,6 +625,47 @@ int MDSMonitor::fail_mds(std::ostream &ss, const std::string &arg)
    return 0;
  }
  
+// Reset the pending mdsmap so rank 0 is the only 'in' rank (marked failed), and
+// blacklist every up mds.  Returns 0, or -EAGAIN (reason in ss) with no changes.
+int MDSMonitor::reset_cluster(std::ostream &ss)
+{
+  dout(10) << "reset_cluster" << dendl;
+  const bool any_up = pending_mdsmap.up.size() > 0;
+  if (any_up && !mon->osdmon()->paxos->is_writeable()) {
+    ss << "osdmap not writeable, can't blacklist up mds's";
+    return -EAGAIN;
+  }
+
+  // retire every 'in' and 'failed' rank to 'stopped'...
+  pending_mdsmap.stopped.insert(pending_mdsmap.in.begin(), pending_mdsmap.in.end());
+  pending_mdsmap.in.clear();
+  pending_mdsmap.stopped.insert(pending_mdsmap.failed.begin(), pending_mdsmap.failed.end());
+  pending_mdsmap.failed.clear();
+  // ...then bring rank 0 back as both 'in' and 'failed'
+  pending_mdsmap.stopped.erase(0);
+  pending_mdsmap.failed.insert(0);
+  pending_mdsmap.in.insert(0);
+
+  // Gate on 'up' -- the set the loop walks and the writeable check covered -- not
+  // on mds_info, or an unchecked osdmap proposal fires when nothing is up.
+  if (any_up) {
+    utime_t until = g_clock.now();
+    until += g_conf.mds_blacklist_interval;
+    for (map<int32_t,uint64_t>::iterator p = pending_mdsmap.up.begin();
+        p != pending_mdsmap.up.end(); ++p) {
+      MDSMap::mds_info_t& info = pending_mdsmap.mds_info[p->second];
+      dout(10) << " blacklisting gid " << p->second << " " << info.addr << dendl;
+      pending_mdsmap.last_failure_osd_epoch = mon->osdmon()->blacklist(info.addr, until);
+    }
+    mon->osdmon()->propose_pending();
+  }
+  pending_mdsmap.up.clear();
+  pending_mdsmap.mds_info.clear();
+
+  ss << "reset mds cluster to single mds";
+  return 0;
+}
+
  bool MDSMonitor::prepare_command(MMonCommand *m)
  {
    int r = -EINVAL;
@@ -703,6 +744,9 @@ bool MDSMonitor::prepare_command(MMonCommand *m)
        paxos->wait_for_commit(new Monitor::C_Command(mon, m, 0, rs, paxos->get_version()));
        return true;
      }
+    else if (m->cmd[1] == "cluster_reset") {
+      r = reset_cluster(ss);
+    }
      else if (m->cmd[1] == "compat" && m->cmd.size() == 4) {
        uint64_t f = atoll(m->cmd[3].c_str());
        if (m->cmd[2] == "rm_compat") {
diff --git a/src/mon/MDSMonitor.h b/src/mon/MDSMonitor.h

index 528acec1abf8d25978a760b712cd37a5e32fa3d7..372804b419ee425e76d7c32881f9041dbfd6efb1 100644 (file)
--- a/src/mon/MDSMonitor.h
+++ b/src/mon/MDSMonitor.h
@@ -87,8 +87,10 @@ class MDSMonitor : public PaxosService {
    bool prepare_offload_targets(MMDSLoadTargets *m);
  
    enum health_status_t get_health(std::ostream &ss) const;
-  bool preprocess_command(MMonCommand *m);
    int fail_mds(std::ostream &ss, const std::string &arg);
+  int reset_cluster(std::ostream &ss);
+
+  bool preprocess_command(MMonCommand *m);
    bool prepare_command(MMonCommand *m);
  
    // beacons
author	Sage Weil <sage@newdream.net>
	Thu, 27 Jan 2011 16:15:23 +0000 (08:15 -0800)
committer	Sage Weil <sage@newdream.net>
	Thu, 27 Jan 2011 16:34:29 +0000 (08:34 -0800)
src/mon/MDSMonitor.cc		patch \| blob \| history
src/mon/MDSMonitor.h		patch \| blob \| history