osd: fix race between op_wq and context_queue 24761/head
author     Sage Weil <sage@redhat.com>
           Thu, 25 Oct 2018 19:24:02 +0000 (14:24 -0500)
committer  Sage Weil <sage@redhat.com>
           Fri, 26 Oct 2018 15:27:09 +0000 (10:27 -0500)
        ThreadA                                           ThreadB
  sdata->shard_lock.Lock();
  if (sdata->pqueue->empty() &&
     !(is_smallest_thread_index && !sdata->context_queue.empty())) {

                                                  void queue(list<Context *>& ls) {
                                                    bool empty = false;
                                                    {
                                                      std::scoped_lock l(q_mutex);
                                                      if (q.empty()) {
                                                        q.swap(ls);
                                                        empty = true;
                                                      } else {
                                                        q.insert(q.end(), ls.begin(), ls.end());
                                                      }
                                                    }

                                                    if (empty) {
                                                      mutex.Lock();
                                                      cond.Signal();
                                                      mutex.Unlock();
                                                    }
                                                  }

    sdata->sdata_wait_lock.Lock();
    if (!sdata->stop_waiting) {

In this interleaving ThreadA sees an empty context_queue, but before it
takes sdata_wait_lock and goes to sleep, ThreadB queues new contexts and
signals the cond.  The wakeup is lost and the queued contexts may sit
unprocessed until something else wakes the thread.

Fix by simply rechecking that context_queue is empty after taking the
wait lock.  We still do the first check without taking that lock, which
keeps the hot/busy path fast (we avoid the wait lock in general), at the
expense of taking the context_queue qlock twice in the idle/wait path
(where the extra latency/cycles don't matter).
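
For illustration only, a minimal self-contained sketch of the same
check / lock / recheck-before-wait pattern follows.  The names here
(queue_mutex, wait_mutex, wait_cond, pending, queue_work, wait_for_work)
are made-up stand-ins for the qlock, sdata_wait_lock, sdata_cond and
context_queue, not the actual OSD types:

  #include <condition_variable>
  #include <deque>
  #include <mutex>

  std::mutex queue_mutex;             // plays the role of the context_queue qlock
  std::deque<int> pending;            // stand-in for context_queue
  std::mutex wait_mutex;              // plays the role of sdata_wait_lock
  std::condition_variable wait_cond;  // plays the role of sdata_cond

  static bool queue_empty() {
    std::lock_guard<std::mutex> l(queue_mutex);
    return pending.empty();
  }

  // Producer side (ThreadB's role): append work, then signal while
  // holding the wait lock so a consumer that has already rechecked
  // under that lock cannot miss the wakeup.
  void queue_work(int item) {
    {
      std::lock_guard<std::mutex> l(queue_mutex);
      pending.push_back(item);
    }
    std::lock_guard<std::mutex> wl(wait_mutex);
    wait_cond.notify_one();
  }

  // Consumer side (ThreadA's role): the cheap check without the wait
  // lock keeps the busy path fast; the recheck under the wait lock
  // closes the race described above.
  void wait_for_work() {
    if (!queue_empty())
      return;                          // busy path: never touch wait_mutex
    std::unique_lock<std::mutex> wl(wait_mutex);
    if (!queue_empty())
      return;                          // raced with an addition; don't wait
    wait_cond.wait(wl, [] { return !queue_empty(); });
  }

With the recheck in place, wait_for_work() only blocks if pending was
empty while wait_mutex was held, and any later queue_work() then finds a
registered waiter to signal.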

Fixes: http://tracker.ceph.com/issues/36473
Signed-off-by: Jianpeng Ma <jianpeng.ma@intel.com>
Signed-off-by: Sage Weil <sage@redhat.com>
src/osd/OSD.cc

index 0c07b1b2945b1fa9426c50c30f0e856894142873..5479b598dc63fb3d85d5fbc07b986b0b7f56b047 100644
@@ -10196,17 +10196,21 @@ void OSD::ShardedOpWQ::_process(uint32_t thread_index, heartbeat_handle_d *hb)
   auto& sdata = osd->shards[shard_index];
   ceph_assert(sdata);
 
-  // If all threads of shards do oncommits, there is a out-of-order problem.
-  // So we choose the thread which has the smallest thread_index(thread_index < num_shards) of shard
-  // to do oncommit callback.
+  // If all threads of shards do oncommits, there is a out-of-order
+  // problem.  So we choose the thread which has the smallest
+  // thread_index(thread_index < num_shards) of shard to do oncommit
+  // callback.
   bool is_smallest_thread_index = thread_index < osd->num_shards;
 
   // peek at spg_t
   sdata->shard_lock.Lock();
   if (sdata->pqueue->empty() &&
-     !(is_smallest_thread_index && !sdata->context_queue.empty())) {
+      (!is_smallest_thread_index || sdata->context_queue.empty())) {
     sdata->sdata_wait_lock.Lock();
-    if (!sdata->stop_waiting) {
+    if (is_smallest_thread_index && !sdata->context_queue.empty()) {
+      // we raced with a context_queue addition, don't wait
+      sdata->sdata_wait_lock.Unlock();
+    } else if (!sdata->stop_waiting) {
       dout(20) << __func__ << " empty q, waiting" << dendl;
       osd->cct->get_heartbeat_map()->clear_timeout(hb);
       sdata->shard_lock.Unlock();