qa/tasks/nvmeof.py: Improve thrasher and rbd image creation

author Vallari Agrawal <vallari.agrawal@ibm.com>

Tue, 19 Nov 2024 06:06:09 +0000 (11:36 +0530)

committer Vallari Agrawal <vallari.agrawal@ibm.com>

Tue, 26 Nov 2024 08:11:01 +0000 (13:41 +0530)
author Vallari Agrawal <vallari.agrawal@ibm.com>
Tue, 19 Nov 2024 06:06:09 +0000 (11:36 +0530)
committer Vallari Agrawal <vallari.agrawal@ibm.com>
Tue, 26 Nov 2024 08:11:01 +0000 (13:41 +0530)
diff --git a/qa/suites/nvmeof/thrash/thrashers/nvmeof_thrash.yaml b/qa/suites/nvmeof/thrash/thrashers/nvmeof_thrash.yaml

index 8949e163401fb11bf38c0ec37ada23aea1f1d773..b58dc14d87bd2e17872cb44b3de87718ca237152 100644 (file)
--- a/qa/suites/nvmeof/thrash/thrashers/nvmeof_thrash.yaml
+++ b/qa/suites/nvmeof/thrash/thrashers/nvmeof_thrash.yaml
@@ -13,3 +13,4 @@ overrides:
  tasks:
  - nvmeof.thrash:
      checker_host: 'client.0'
+    randomize: False
diff --git a/qa/tasks/nvmeof.py b/qa/tasks/nvmeof.py

index 5defc710fed39ad07e81cc00a8df49d84ae795a3..c58a7267b4e98d488f4620aa21f650f37bc57499 100644 (file)
--- a/qa/tasks/nvmeof.py
+++ b/qa/tasks/nvmeof.py
@@ -128,12 +128,11 @@ class Nvmeof(Task):
  
              total_images = int(self.namespaces_count) * int(self.subsystems_count)
              log.info(f'[nvmeof]: creating {total_images} images')
+            rbd_create_cmd = []
              for i in range(1, total_images + 1):
                  imagename = self.image_name_prefix + str(i)
-                log.info(f'[nvmeof]: rbd create {poolname}/{imagename} --size {self.rbd_size}')
-                _shell(self.ctx, self.cluster_name, self.remote, [
-                    'rbd', 'create', f'{poolname}/{imagename}', '--size', f'{self.rbd_size}'
-                ])
+                rbd_create_cmd += ['rbd', 'create', f'{poolname}/{imagename}', '--size', f'{self.rbd_size}', run.Raw(';')]           
+            _shell(self.ctx, self.cluster_name, self.remote, rbd_create_cmd)     
  
          for role, i in daemons.items():
              remote, id_ = i
@@ -311,7 +310,7 @@ class NvmeofThrasher(Thrasher, Greenlet):
  
          self.min_thrash_delay = int(self.config.get('min_thrash_delay', 60))
          self.max_thrash_delay = int(self.config.get('max_thrash_delay', self.min_thrash_delay + 30))
-        self.min_revive_delay = int(self.config.get('min_revive_delay', 100))
+        self.min_revive_delay = int(self.config.get('min_revive_delay', 60))
          self.max_revive_delay = int(self.config.get('max_revive_delay', self.min_revive_delay + 30))
  
      def _get_devices(self, remote):
@@ -422,13 +421,11 @@ class NvmeofThrasher(Thrasher, Greenlet):
          while not self.stopping.is_set():
              killed_daemons = defaultdict(list)
  
-            weight = 1.0 / len(self.daemons)
-            count = 0
+            thrash_daemon_num = self.rng.randint(1, self.max_thrash_daemons)
+            selected_daemons = self.rng.sample(self.daemons, thrash_daemon_num)
              for daemon in self.daemons:
-                skip = self.rng.uniform(0.0, 1.0)
-                if weight <= skip:
-                    self.log('skipping daemon {label} with skip ({skip}) > weight ({weight})'.format(
-                        label=daemon.id_, skip=skip, weight=weight))
+                if daemon not in selected_daemons:
+                    self.log(f'skipping daemon {daemon.id_} ...')
                      continue
  
                  # For now, nvmeof daemons can only be thrashed 3 times in last 30mins. 
@@ -446,17 +443,11 @@ class NvmeofThrasher(Thrasher, Greenlet):
                          continue
  
                  self.log('kill {label}'.format(label=daemon.id_))
-                # daemon.stop()
                  kill_method = self.kill_daemon(daemon)
  
                  killed_daemons[kill_method].append(daemon)
                  daemons_thrash_history[daemon.id_] += [datetime.now()]
  
-                # only thrash max_thrash_daemons amount of daemons
-                count += 1
-                if count >= self.max_thrash_daemons:
-                    break
-
              if killed_daemons:
                  iteration_summary = "thrashed- "
                  for kill_method in killed_daemons:
author	Vallari Agrawal <vallari.agrawal@ibm.com>
	Tue, 19 Nov 2024 06:06:09 +0000 (11:36 +0530)
committer	Vallari Agrawal <vallari.agrawal@ibm.com>
	Tue, 26 Nov 2024 08:11:01 +0000 (13:41 +0530)
qa/suites/nvmeof/thrash/thrashers/nvmeof_thrash.yaml		patch \| blob \| history
qa/tasks/nvmeof.py		patch \| blob \| history