From: Jason Dillaman Date: Sun, 7 Sep 2014 02:59:40 +0000 (-0400) Subject: Enforce cache size on read requests X-Git-Tag: v0.86~119^2 X-Git-Url: http://git-server-git.apps.pok.os.sepia.ceph.com/?a=commitdiff_plain;h=refs%2Fpull%2F2422%2Fhead;p=ceph.git Enforce cache size on read requests In-flight cache reads were not previously counted against new cache read requests, which could result in very large cache usage. This effect is most noticeable when writing small chunks to a cloned image since each write requires a full object read from the parent. Signed-off-by: Jason Dillaman --- diff --git a/src/osdc/ObjectCacher.cc b/src/osdc/ObjectCacher.cc index e7dfe18bb060..1f58674ec7fa 100644 --- a/src/osdc/ObjectCacher.cc +++ b/src/osdc/ObjectCacher.cc @@ -763,6 +763,9 @@ void ObjectCacher::bh_read_finish(int64_t poolid, sobject_t oid, ceph_tid_t tid, loff_t oldpos = opos; opos = bh->end(); + ls.splice(ls.end(), waitfor_read); + waitfor_read.clear(); + if (r == -ENOENT) { if (trust_enoent) { ldout(cct, 10) << "bh_read_finish removing " << *bh << dendl; @@ -1110,13 +1113,26 @@ int ObjectCacher::_readx(OSDRead *rd, ObjectSet *oset, Context *onfinish, for (map<loff_t, BufferHead*>::iterator bh_it = missing.begin(); bh_it != missing.end(); ++bh_it) { - bh_read(bh_it->second); - if (success && onfinish) { - ldout(cct, 10) << "readx missed, waiting on " << *bh_it->second - << " off " << bh_it->first << dendl; - bh_it->second->waitfor_read[bh_it->first].push_back( new C_RetryRead(this, rd, oset, onfinish) ); + loff_t clean = get_stat_clean() + get_stat_rx() + + bh_it->second->length(); + if (get_stat_rx() > 0 && static_cast<uint64_t>(clean) > max_size) { + // cache is full -- wait for rx's to complete + ldout(cct, 10) << "readx missed, waiting on cache to free " + << (clean - max_size) << " bytes" << dendl; + if (success) { + waitfor_read.push_back(new C_RetryRead(this, rd, oset, onfinish)); + } + bh_remove(o, bh_it->second); + delete bh_it->second; + } else { + bh_read(bh_it->second); + if (success && 
onfinish) { + ldout(cct, 10) << "readx missed, waiting on " << *bh_it->second + << " off " << bh_it->first << dendl; + bh_it->second->waitfor_read[bh_it->first].push_back( new C_RetryRead(this, rd, oset, onfinish) ); + } + bytes_not_in_cache += bh_it->second->length(); } - bytes_not_in_cache += bh_it->second->length(); success = false; } diff --git a/src/osdc/ObjectCacher.h b/src/osdc/ObjectCacher.h index ca16138fa2d0..9685ee3838be 100644 --- a/src/osdc/ObjectCacher.h +++ b/src/osdc/ObjectCacher.h @@ -340,6 +340,7 @@ class ObjectCacher { void *flush_set_callback_arg; vector<ceph::unordered_map<sobject_t, Object*> > objects; // indexed by pool_id + list<Context*> waitfor_read; ceph_tid_t last_read_tid;