From 955d81416ee1e92ab5f279b1475be750316e8475 Mon Sep 17 00:00:00 2001
From: Patrick Donnelly <pdonnell@redhat.com>
Date: Fri, 15 Feb 2019 11:57:43 -0800
Subject: [PATCH] MDSMonitor: do not assign standby-replay when degraded

The journal (or potentially other rank metadata) may be in the process of being
migrated or modified.

Fixes: http://tracker.ceph.com/issues/36384
Signed-off-by: Patrick Donnelly <pdonnell@redhat.com>
(cherry picked from commit 065e98edfb26c1bbf9779e1094b966ac428247c5)
---
 src/mon/MDSMonitor.cc | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)
diff --git a/src/mon/MDSMonitor.cc b/src/mon/MDSMonitor.cc
index 7be5f14f77a65..4cc066fc6ec7e 100644
--- a/src/mon/MDSMonitor.cc
+++ b/src/mon/MDSMonitor.cc
@@ -2173,9 +2173,10 @@ bool MDSMonitor::maybe_promote_standby(FSMap &fsmap, std::shared_ptr<Filesystem>
 	do_propose = true;
       }
     }
-  } else {
+  } else if (!fs->mds_map.is_degraded()) {
     // There were no failures to replace, so try using any available standbys
-    // as standby-replay daemons.
+    // as standby-replay daemons. Don't do this when the cluster is degraded
+    // as a standby-replay daemon may try to read a journal being migrated.
 
     // Take a copy of the standby GIDs so that we can iterate over
     // them while perhaps-modifying standby_daemons during the loop
-- 
2.39.5