From 11fb16df06ad61e228c17feedf00dfb85f0477d5 Mon Sep 17 00:00:00 2001 From: Xiubo Li Date: Sat, 10 Apr 2021 12:52:24 +0800 Subject: [PATCH] client: wait rename to finish In rare case during the rename if another thread tries to lookup the dst dentry, it may get an inconsistent result that both src dentry and dst dentry will link to the same inode at the same time. Will wait the rename to finish and try it again. Fixes: https://tracker.ceph.com/issues/49912 Signed-off-by: Xiubo Li --- src/client/Client.cc | 32 +++++++++++++++++++++++++++++--- src/client/Client.h | 5 ++++- src/client/Dentry.h | 1 + 3 files changed, 34 insertions(+), 4 deletions(-) diff --git a/src/client/Client.cc b/src/client/Client.cc index 83885a980e3..5ee98df02d3 100644 --- a/src/client/Client.cc +++ b/src/client/Client.cc @@ -1210,6 +1210,11 @@ Dentry *Client::insert_dentry_inode(Dir *dir, const string& dname, LeaseStat *dl Inode *diri = dir->parent_inode; clear_dir_complete_and_ordered(diri, false); dn = link(dir, dname, in, dn); + + if (old_dentry) { + dn->is_renaming = false; + signal_cond_list(waiting_for_rename); + } } update_dentry_lease(dn, dlease, from, session); @@ -7129,7 +7134,8 @@ bool Client::_dentry_valid(const Dentry *dn) } int Client::_lookup(Inode *dir, const string& dname, int mask, InodeRef *target, - const UserPerm& perms, std::string* alternate_name) + const UserPerm& perms, std::string* alternate_name, + bool is_rename) { int r = 0; Dentry *dn = NULL; @@ -7208,6 +7214,19 @@ relookup: } else { ldout(cct, 20) << " no cap on " << dn->inode->vino() << dendl; } + + // In rare case during the rename if another thread tries to + // lookup the dst dentry, it may get an inconsistent result + // that both src dentry and dst dentry will link to the same + // inode at the same time. + // Will wait the rename to finish and try it again. + if (!is_rename && dn->is_renaming) { + ldout(cct, 1) << __func__ << " dir " << *dir + << " rename is on the way, will wait for dn '" + << dname << "'" << dendl; + wait_on_list(waiting_for_rename); + goto relookup; + } } else { // can we conclude ENOENT locally? if (dir->caps_issued_mask(CEPH_CAP_FILE_SHARED, true) && @@ -14398,12 +14417,13 @@ int Client::_rename(Inode *fromdir, const char *fromname, Inode *todir, const ch req->old_dentry_drop = CEPH_CAP_FILE_SHARED; req->old_dentry_unless = CEPH_CAP_FILE_EXCL; + de->is_renaming = true; req->set_dentry(de); req->dentry_drop = CEPH_CAP_FILE_SHARED; req->dentry_unless = CEPH_CAP_FILE_EXCL; InodeRef oldin, otherin; - res = _lookup(fromdir, fromname, 0, &oldin, perm); + res = _lookup(fromdir, fromname, 0, &oldin, perm, nullptr, true); if (res < 0) goto fail; @@ -14412,7 +14432,7 @@ int Client::_rename(Inode *fromdir, const char *fromname, Inode *todir, const ch req->set_old_inode(oldinode); req->old_inode_drop = CEPH_CAP_LINK_SHARED; - res = _lookup(todir, toname, 0, &otherin, perm); + res = _lookup(todir, toname, 0, &otherin, perm, nullptr, true); switch (res) { case 0: { @@ -14441,6 +14461,12 @@ int Client::_rename(Inode *fromdir, const char *fromname, Inode *todir, const ch res = make_request(req, perm, &target); ldout(cct, 10) << "rename result is " << res << dendl; + // if rename fails it will miss waking up the waiters + if (op == CEPH_MDS_OP_RENAME && de->is_renaming) { + de->is_renaming = false; + signal_cond_list(waiting_for_rename); + } + // renamed item from our cache trim_cache(); diff --git a/src/client/Client.h b/src/client/Client.h index 9a0b15993d7..911a8b460df 100644 --- a/src/client/Client.h +++ b/src/client/Client.h @@ -1341,7 +1341,8 @@ private: const UserPerm& perms); int _lookup(Inode *dir, const std::string& dname, int mask, InodeRef *target, - const UserPerm& perm, std::string* alternate_name=nullptr); + const UserPerm& perm, std::string* alternate_name=nullptr, + bool is_rename=false); int _link(Inode *in, Inode *dir, const char *name, const UserPerm& perm, std::string alternate_name, InodeRef *inp = 0); @@ -1594,6 +1595,8 @@ private: std::map, int> pool_perms; std::list waiting_for_pool_perm; + std::list waiting_for_rename; + uint64_t retries_on_invalidate = 0; // state reclaim diff --git a/src/client/Dentry.h b/src/client/Dentry.h index 94722c5de70..8003dfed34b 100644 --- a/src/client/Dentry.h +++ b/src/client/Dentry.h @@ -91,6 +91,7 @@ public: ceph_seq_t lease_seq = 0; int cap_shared_gen = 0; std::string alternate_name; + bool is_renaming = false; private: xlist::item inode_xlist_link; -- 2.39.5