osd/PrimaryLogPG: avoid infinite loop when flush collides with write lock

author: Sage Weil <sage@redhat.com>, Wed, 25 Apr 2018 20:32:38 +0000 (15:32 -0500)
committer: Sage Weil <sage@redhat.com>, Wed, 25 Apr 2018 20:34:21 +0000 (15:34 -0500)

diff --git a/src/osd/PrimaryLogPG.cc b/src/osd/PrimaryLogPG.cc

index a5c260740f8e609d2887661c8991b4d8943470e7..3b18934b4eb1af220099fb0dcd27684cc2d575fc 100644 (file)
--- a/src/osd/PrimaryLogPG.cc
+++ b/src/osd/PrimaryLogPG.cc
@@ -10009,10 +10009,18 @@ int PrimaryLogPG::try_flush_mark_clean(FlushOpRef fop)
         fop->op)) {
      dout(20) << __func__ << " took write lock" << dendl;
    } else if (fop->op) {
-    dout(10) << __func__ << " waiting on write lock" << dendl;
+    dout(10) << __func__ << " waiting on write lock " << fop->op << " "
+            << fop->dup_ops << dendl;
      close_op_ctx(ctx.release());
-    requeue_op(fop->op);
-    requeue_ops(fop->dup_ops);
+    // fop->op is now waiting on the lock; get fop->dup_ops to wait too.
+    for (auto op : fop->dup_ops) {
+      bool locked = ctx->lock_manager.get_lock_type(
+       ObjectContext::RWState::RWWRITE,
+       oid,
+       obc,
+       op);
+      assert(!locked);
+    }
      return -EAGAIN;    // will retry
    } else {
      dout(10) << __func__ << " failed write lock, no op; failing" << dendl;
author	Sage Weil <sage@redhat.com>
	Wed, 25 Apr 2018 20:32:38 +0000 (15:32 -0500)
committer	Sage Weil <sage@redhat.com>
	Wed, 25 Apr 2018 20:34:21 +0000 (15:34 -0500)