client: op cancellation on per pool full flag

author John Spray <john.spray@redhat.com>

Tue, 31 Mar 2015 12:21:43 +0000 (13:21 +0100)

committer John Spray <john.spray@redhat.com>

Tue, 12 May 2015 09:20:41 +0000 (10:20 +0100)
author John Spray <john.spray@redhat.com>
Tue, 31 Mar 2015 12:21:43 +0000 (13:21 +0100)
committer John Spray <john.spray@redhat.com>
Tue, 12 May 2015 09:20:41 +0000 (10:20 +0100)
diff --git a/src/client/Client.cc b/src/client/Client.cc

index 063958f0c3b92f8dda9eb789d27a9a06e9452460..c9b3c8909a0e11bb7dbfbe09e8423002c8fc4420 100644 (file)
--- a/src/client/Client.cc
+++ b/src/client/Client.cc
@@ -2091,37 +2091,66 @@ void Client::handle_client_reply(MClientReply *reply)
      mount_cond.Signal();
  }
  
+void Client::_handle_full_flag(int64_t pool)
+{
+  ldout(cct, 1) << __func__ << ": FULL: cancelling outstanding operations "
+    << "on " << pool << dendl;
+  // Cancel all outstanding ops with -ENOSPC: it is necessary to do this rather
+  // than blocking, because otherwise when we fill up we potentially lock caps
+  // forever on files with dirty pages, and we need to be able to release
+  // those caps to the MDS so that it can delete files and free up space.
+  epoch_t cancelled_epoch = objecter->op_cancel_writes(-ENOSPC, pool);
+
+  // For all inodes with a pending flush write op (i.e. one of the ones we
+  // will cancel), we've got to purge_set their data from ObjectCacher
+  // so that it doesn't re-issue the write in response to the ENOSPC error.
+  // Fortunately since we're cancelling *everything*, we don't need to know
+  // which ops belong to which ObjectSet, we can just blow all the un-flushed
+  // cached data away and mark any dirty inodes' async_err field with -ENOSPC
+  // (i.e. we only need to know which inodes had outstanding ops, not the exact
+  // op-to-inode relation)
+  for (unordered_map<vinodeno_t,Inode*>::iterator i = inode_map.begin();
+       i != inode_map.end(); ++i)
+  {
+    Inode *inode = i->second;
+    if (inode->oset.dirty_or_tx
+        && (pool == -1 || inode->layout.fl_pg_pool == pool)) {
+      ldout(cct, 4) << __func__ << ": FULL: inode 0x" << std::hex << i->first << std::dec
+        << " has dirty objects, purging and setting ENOSPC" << dendl;
+      objectcacher->purge_set(&inode->oset);
+      inode->async_err = -ENOSPC;
+    }
+  }
+
+  if (cancelled_epoch != (epoch_t)-1) {
+    set_cap_epoch_barrier(cancelled_epoch);
+  }
+}
+
  void Client::handle_osd_map(MOSDMap *m)
  {
    if (objecter->osdmap_full_flag()) {
-    ldout(cct, 1) << __func__ << ": FULL: cancelling outstanding operations" << dendl;
-    // Cancel all outstanding ops with -ENOSPC: it is necessary to do this rather than blocking,
-    // because otherwise when we fill up we potentially lock caps forever on files with
-    // dirty pages, and we need to be able to release those caps to the MDS so that it can
-    // delete files and free up space.
-    epoch_t cancelled_epoch = objecter->op_cancel_writes(-ENOSPC);
-
-    // For all inodes with a pending flush write op (i.e. one of the ones we
-    // will cancel), we've got to purge_set their data from ObjectCacher
-    // so that it doesn't re-issue the write in response to the ENOSPC error.
-    // Fortunately since we're cancelling *everything*, we don't need to know
-    // which ops belong to which ObjectSet, we can just blow all the un-flushed
-    // cached data away and mark any dirty inodes' async_err field with -ENOSPC
-    // (i.e. we only need to know which inodes had outstanding ops, not the exact
-    // op-to-inode relation)
-    for (unordered_map<vinodeno_t,Inode*>::iterator i = inode_map.begin();
-         i != inode_map.end(); ++i)
-    {
-      Inode *inode = i->second;
-      if (inode->oset.dirty_or_tx) {
-        ldout(cct, 4) << __func__ << ": FULL: inode 0x" << std::hex << i->first << std::dec
-          << " has dirty objects, purging and setting ENOSPC" << dendl;
-        objectcacher->purge_set(&inode->oset);
-        inode->async_err = -ENOSPC;
+    _handle_full_flag(-1);
+  } else {
+    // Accumulate local list of full pools so that I can drop
+    // the OSDMap lock before handling them.
+    std::vector<int64_t> full_pools;
+
+    const OSDMap *osd_map = objecter->get_osdmap_read();
+    const map<int64_t,pg_pool_t>& pools = osd_map->get_pools();
+    for (map<int64_t,pg_pool_t>::const_iterator i = pools.begin();
+         i != pools.end(); ++i) {
+      if (i->second.has_flag(pg_pool_t::FLAG_FULL)) {
+        full_pools.push_back(i->first);
        }
      }
  
-    set_cap_epoch_barrier(cancelled_epoch);
+    objecter->put_osdmap_read();
+
+    for (std::vector<int64_t>::iterator i = full_pools.begin();
+         i != full_pools.end(); ++i) {
+      _handle_full_flag(*i);
+    }
    }
  
    m->put();
diff --git a/src/client/Client.h b/src/client/Client.h

index 4430e565faca747558e74bcf76e6350f81bed79f..6aaffa6cce6c32debbeac6f0110184e34bfdc03f 100644 (file)
--- a/src/client/Client.h
+++ b/src/client/Client.h
@@ -482,6 +482,14 @@ protected:
    list<Cond*> waiting_for_pool_perm;
    int check_pool_perm(Inode *in, int need);
  
+  /**
+   * Call this when an OSDMap is seen with a full flag (global or per pool)
+   * set.
+   *
+   * @param pool the pool ID affected, or -1 if all.
+   */
+  void _handle_full_flag(int64_t pool);
+
   public:
    void set_filer_flags(int flags);
    void clear_filer_flags(int flags);
author	John Spray <john.spray@redhat.com>
	Tue, 31 Mar 2015 12:21:43 +0000 (13:21 +0100)
committer	John Spray <john.spray@redhat.com>
	Tue, 12 May 2015 09:20:41 +0000 (10:20 +0100)
src/client/Client.cc		patch \| blob \| history
src/client/Client.h		patch \| blob \| history