mds: fix handling very fast delete ops

author John Spray <john.spray@redhat.com>

Thu, 9 Mar 2017 10:43:32 +0000 (10:43 +0000)

committer John Spray <john.spray@redhat.com>

Thu, 9 Mar 2017 11:28:51 +0000 (11:28 +0000)
author John Spray <john.spray@redhat.com>
Thu, 9 Mar 2017 10:43:32 +0000 (10:43 +0000)
committer John Spray <john.spray@redhat.com>
Thu, 9 Mar 2017 11:28:51 +0000 (11:28 +0000)
diff --git a/src/mds/PurgeQueue.cc b/src/mds/PurgeQueue.cc

index f9617b81643b90c530272da506110ca210aedf12..7bea41bfab3a0ad3d09afdabb77534ed1d1b8d79 100644 (file)
--- a/src/mds/PurgeQueue.cc
+++ b/src/mds/PurgeQueue.cc
@@ -398,16 +398,40 @@ void PurgeQueue::_execute_item(
    assert(gather.has_subs());
  
    gather.set_finisher(new FunctionContext([this, expire_to](int r){
-    execute_item_complete(expire_to);
+    if (lock.is_locked_by_me()) {
+      // Fast completion, Objecter ops completed before we hit gather.activate()
+      // and we're being called inline.  We are still inside _consume so
+      // no need to call back into it.
+      _execute_item_complete(expire_to);
+    } else {
+      // Normal completion, we're being called back from outside PurgeQueue::lock
+      // by the Objecter.  Take the lock, and call back into _consume to
+      // find more work.
+      Mutex::Locker l(lock);
+      _execute_item_complete(expire_to);
+
+      _consume();
+    }
+
+    // Have we gone idle?  If so, do an extra write_head now instead of
+    // waiting for next flush after journaler_write_head_interval.
+    // Also do this periodically even if not idle, so that the persisted
+    // expire_pos doesn't fall too far behind our progress when consuming
+    // a very long queue.
+    if (in_flight.empty() || journaler.write_head_needed()) {
+      journaler.write_head(new FunctionContext([this](int r){
+            journaler.trim();
+            }));
+    }
    }));
    gather.activate();
  }
  
-void PurgeQueue::execute_item_complete(
+void PurgeQueue::_execute_item_complete(
      uint64_t expire_to)
  {
+  assert(lock.is_locked_by_me());
    dout(10) << "complete at 0x" << std::hex << expire_to << std::dec << dendl;
-  Mutex::Locker l(lock);
    assert(in_flight.count(expire_to) == 1);
  
    auto iter = in_flight.find(expire_to);
@@ -434,19 +458,6 @@ void PurgeQueue::execute_item_complete(
    dout(10) << "in_flight.size() now " << in_flight.size() << dendl;
  
    logger->inc(l_pq_executed);
-
-  _consume();
-
-  // Have we gone idle?  If so, do an extra write_head now instead of
-  // waiting for next flush after journaler_write_head_interval.
-  // Also do this periodically even if not idle, so that the persisted
-  // expire_pos doesn't fall too far behind our progress when consuming
-  // a very long queue.
-  if (in_flight.empty() || journaler.write_head_needed()) {
-    journaler.write_head(new FunctionContext([this](int r){
-          journaler.trim();
-          }));
-  }
  }
  
  void PurgeQueue::update_op_limit(const MDSMap &mds_map)
diff --git a/src/mds/PurgeQueue.h b/src/mds/PurgeQueue.h

index a0b0346137843fe900db729e1f811557dfb146c7..33b8c8617998a8c5cfc87489336cc5b254d38e04 100644 (file)
--- a/src/mds/PurgeQueue.h
+++ b/src/mds/PurgeQueue.h
@@ -124,7 +124,7 @@ protected:
    void _execute_item(
        const PurgeItem &item,
        uint64_t expire_to);
-  void execute_item_complete(
+  void _execute_item_complete(
        uint64_t expire_to);
author	John Spray <john.spray@redhat.com>
	Thu, 9 Mar 2017 10:43:32 +0000 (10:43 +0000)
committer	John Spray <john.spray@redhat.com>
	Thu, 9 Mar 2017 11:28:51 +0000 (11:28 +0000)
src/mds/PurgeQueue.cc		patch | blob | history
src/mds/PurgeQueue.h		patch | blob | history