There's a race between the client and osd with a newly marked full
osdmap. If the client gets the new map first, it blocks writes and
everything works as expected, with no errors from the osd.

If the osd gets the map first, however, it will respond to any writes
with -ENOSPC. Clients will pass this up the stack, and not retry these
writes later. -ENOSPC isn't handled well by all clients. RBD, for
example, may pass it on to qemu or kernel rbd, both of which will
interpret it as EIO. Filesystems on top of rbd will not behave well
when they receive EIOs like this, especially if the cluster oscillates
between full and not full, so that some writes succeed while others fail.

To fix this, never return ENOSPC from the osd because of a map marked
full, and rely on the client to retry all writes when the map is no
longer marked full.
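
To make the decision concrete, here is a minimal sketch of the osd-side
check, with illustrative names (FullState, should_drop_write) that are not
the actual code in the patch below:

#include <cstdint>

using epoch_t = uint32_t;  // assumption: epochs are small unsigned integers

struct FullState {
  bool map_marked_full;          // current osdmap has the full flag set
  epoch_t last_map_marked_full;  // newest epoch known to have been marked full
};

// True if a write should be silently dropped rather than answered with
// -ENOSPC; the client will resend it once it sees a map without the flag.
bool should_drop_write(const FullState& s, epoch_t client_map_epoch) {
  return s.map_marked_full || client_map_epoch < s.last_map_marked_full;
}

The second condition covers clients whose op was tagged with a map epoch
older than the last epoch the osd saw marked full, i.e. clients that may
not know about the full flag yet.
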
Old clients talking to osds with this fix will hang instead of
propagating an error, but only if they run into this race
condition. ceph-fuse and rbd with caching enabled are not affected,
since the ObjectCacher will retry writes that return errors.

Refs: #6938
Backport: dumpling, emperor
Signed-off-by: Josh Durgin <josh.durgin@inktank.com>
(cherry picked from commit 4111729dda7437c23f59e7100b3c4a9ec4101dd0)
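
For the client side the fix relies on, here is a simplified, hypothetical
sketch (this is not the Objecter's real interface) of blocking writes while
the map is marked full and resending them once a later map clears the flag:

#include <deque>
#include <functional>

// Hypothetical client-side queue: holds writes back while the osdmap is
// marked full and replays them when a map without the full flag arrives.
class WriteQueue {
public:
  void submit(std::function<void()> send) {
    if (full_)
      pending_.push_back(std::move(send));  // block the write locally
    else
      send();
  }

  // Called for every newly received osdmap.
  void handle_map(bool marked_full) {
    full_ = marked_full;
    if (full_)
      return;
    // Map is no longer full: replay everything held back. A real client
    // also resends in-flight writes, which is why the osd can safely drop
    // them instead of returning an error.
    while (!pending_.empty()) {
      auto op = std::move(pending_.front());
      pending_.pop_front();
      op();
    }
  }

private:
  bool full_ = false;
  std::deque<std::function<void()>> pending_;
};

The osd-side changes below implement the drop behaviour and persist the
most recent full-marked epoch in the superblock so the check survives
restarts.
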
ObjectStore::Transaction &t = *_t;
// store new maps: queue for disk and put in the osdmap cache
+ epoch_t last_marked_full = 0;
epoch_t start = MAX(osdmap->get_epoch() + 1, first);
for (epoch_t e = start; e <= last; e++) {
map<epoch_t,bufferlist>::iterator p;
...
bufferlist& bl = p->second;
o->decode(bl);
+ if (o->test_flag(CEPH_OSDMAP_FULL))
+ last_marked_full = e;
pinned_maps.push_back(add_map(o));
hobject_t fulloid = get_osdmap_pobject_name(e);
...
assert(0 == "bad fsid");
}
+ if (o->test_flag(CEPH_OSDMAP_FULL))
+ last_marked_full = e;
pinned_maps.push_back(add_map(o));
bufferlist fbl;
...
superblock.oldest_map = first;
superblock.newest_map = last;
+ if (last_marked_full > superblock.last_map_marked_full)
+ superblock.last_map_marked_full = last_marked_full;
map_lock.get_write();
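
The superblock only ever raises last_map_marked_full, so replaying older
maps cannot move it backwards and the value survives an osd restart. A
standalone sketch of that update rule, using illustrative names rather than
the actual structures:

#include <algorithm>
#include <cstdint>
#include <vector>

using epoch_t = uint32_t;

// Raise the persisted high-water mark to the newest full-marked epoch seen
// while storing maps; never lower it.
void note_full_epochs(const std::vector<epoch_t>& full_epochs,
                      epoch_t& persisted_last_full) {
  for (epoch_t e : full_epochs)
    persisted_last_full = std::max(persisted_last_full, e);
}

The write-handling path shown next consults this persisted value.
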
if (op->may_write()) {
// full?
if ((service.check_failsafe_full() ||
- osdmap->test_flag(CEPH_OSDMAP_FULL)) &&
+ osdmap->test_flag(CEPH_OSDMAP_FULL) ||
+ m->get_map_epoch() < superblock.last_map_marked_full) &&
!m->get_source().is_mds()) { // FIXME: we'll exclude mds writes for now.
- service.reply_op_error(op, -ENOSPC);
+ // Drop the request, since the client will retry when the full
+ // flag is unset.
return;
}
...
void OSDSuperblock::encode(bufferlist &bl) const
{
- ENCODE_START(5, 5, bl);
+ ENCODE_START(6, 5, bl);
::encode(cluster_fsid, bl);
::encode(whoami, bl);
::encode(current_epoch, bl);
...
::encode(clean_thru, bl);
::encode(mounted, bl);
::encode(osd_fsid, bl);
+ ::encode(last_map_marked_full, bl);
ENCODE_FINISH(bl);
}
void OSDSuperblock::decode(bufferlist::iterator &bl)
{
- DECODE_START_LEGACY_COMPAT_LEN(5, 5, 5, bl);
+ DECODE_START_LEGACY_COMPAT_LEN(6, 5, 5, bl);
if (struct_v < 3) {
string magic;
::decode(magic, bl);
...
::decode(mounted, bl);
if (struct_v >= 4)
::decode(osd_fsid, bl);
+ if (struct_v >= 6)
+ ::decode(last_map_marked_full, bl);
DECODE_FINISH(bl);
}
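
Adding the field bumps the encoded version from 5 to 6 while the compat
version stays at 5, and the decoder only reads it when struct_v >= 6, so
superblocks written by older osds still decode and simply leave
last_map_marked_full at its default of 0. A minimal sketch of this
version-guard pattern, using plain integers instead of Ceph's encoding
macros:

#include <cstdint>
#include <vector>

// Toy word stream standing in for Ceph's bufferlist.
struct Stream {
  std::vector<uint32_t> words;
  size_t pos = 0;
  void put(uint32_t v) { words.push_back(v); }
  uint32_t get() { return pos < words.size() ? words[pos++] : 0; }
};

struct Superblock {
  uint32_t mounted = 0;
  uint32_t clean_thru = 0;
  uint32_t last_map_marked_full = 0;  // new in version 6
};

void encode(const Superblock& sb, Stream& s) {
  s.put(6);  // struct version written by new code
  s.put(sb.mounted);
  s.put(sb.clean_thru);
  s.put(sb.last_map_marked_full);
}

void decode(Superblock& sb, Stream& s) {
  uint32_t struct_v = s.get();
  sb.mounted = s.get();
  sb.clean_thru = s.get();
  if (struct_v >= 6)                     // old encodings end here; the
    sb.last_map_marked_full = s.get();   // field keeps its default of 0
}

Since the field defaults to 0 and epochs are unsigned, the new comparison in
the write path is never true on an osd that has not yet stored a full-marked
map, so upgraded osds behave exactly as before until a full map arrives.
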
...
f->close_section();
f->dump_int("clean_thru", clean_thru);
f->dump_int("last_epoch_mounted", mounted);
+ f->dump_int("last_map_marked_full", last_map_marked_full);
}
void OSDSuperblock::generate_test_instances(list<OSDSuperblock*>& o)
...
z.mounted = 8;
z.clean_thru = 7;
o.push_back(new OSDSuperblock(z));
+ z.last_map_marked_full = 7;
+ o.push_back(new OSDSuperblock(z));
}
// -- SnapSet --
...
// last interval over which i mounted and was then active
epoch_t mounted; // last epoch i mounted
epoch_t clean_thru; // epoch i was active and clean thru
+ epoch_t last_map_marked_full; // last epoch osdmap was marked full
OSDSuperblock() :
whoami(-1),
current_epoch(0), oldest_map(0), newest_map(0), weight(0),
- mounted(0), clean_thru(0) {
+ mounted(0), clean_thru(0), last_map_marked_full(0) {
}
void encode(bufferlist &bl) const;