From: Patrick Donnelly
Date: Tue, 25 Jul 2023 14:18:12 +0000 (-0400)
Subject: qa: check for expected cluster log message
X-Git-Tag: v18.2.1~110^2~1
X-Git-Url: http://git-server-git.apps.pok.os.sepia.ceph.com/?a=commitdiff_plain;h=c8f8324ee2fae48e8d3c2bbdbf45cc9ffe46fd4c;p=ceph-ci.git

qa: check for expected cluster log message

Signed-off-by: Patrick Donnelly
(cherry picked from commit ab3cbf17989412aa1a222dd2eecccc2c90afe6e2)

Conflicts:
    qa/tasks/cephfs/test_damage.py: caused by api change
---

diff --git a/qa/tasks/cephfs/test_damage.py b/qa/tasks/cephfs/test_damage.py
index d83187017e3..bfaa23453b0 100644
--- a/qa/tasks/cephfs/test_damage.py
+++ b/qa/tasks/cephfs/test_damage.py
@@ -608,8 +608,9 @@ class TestDamage(CephFSTestCase):
         self.fs.flush()
         self.config_set("mds", "mds_inject_rename_corrupt_dentry_first", "1.0")
         time.sleep(5) # for conf to percolate
-        p = self.mount_a.run_shell_payload("timeout 60 mv a/b a/z", wait=False)
-        self.wait_until_true(lambda: "laggy_since" in self.fs.get_rank(), timeout=self.fs.beacon_timeout)
+        with self.assert_cluster_log("MDS abort because newly corrupt dentry"):
+            p = self.mount_a.run_shell_payload("timeout 60 mv a/b a/z", wait=False)
+            self.wait_until_true(lambda: "laggy_since" in self.fs.get_rank(), timeout=self.fs.beacon_timeout)
         self.config_rm("mds", "mds_inject_rename_corrupt_dentry_first")
         self.fs.rank_freeze(False, rank=0)
         self.delete_mds_coredump(rank0['name'])
@@ -642,9 +643,10 @@ class TestDamage(CephFSTestCase):
         rank0 = self.fs.get_rank()
         self.fs.rank_freeze(True, rank=0)
         # so now we want to trigger commit but this will crash, so:
-        c = ['--connect-timeout=60', 'tell', f"mds.{fscid}:0", "flush", "journal"]
-        p = self.ceph_cluster.mon_manager.run_cluster_cmd(args=c, wait=False, timeoutcmd=30)
-        self.wait_until_true(lambda: "laggy_since" in self.fs.get_rank(), timeout=self.fs.beacon_timeout)
+        with self.assert_cluster_log("MDS abort because newly corrupt dentry"):
+            c = ['--connect-timeout=60', 'tell', f"mds.{fscid}:0", "flush", "journal"]
+            p = self.ceph_cluster.mon_manager.run_cluster_cmd(args=c, wait=False, timeoutcmd=30)
+            self.wait_until_true(lambda: "laggy_since" in self.fs.get_rank(), timeout=self.fs.beacon_timeout)
         self.config_rm("mds", "mds_inject_journal_corrupt_dentry_first")
         self.fs.rank_freeze(False, rank=0)
         self.delete_mds_coredump(rank0['name'])