task: scrub OSDs periodically
author    Mike Ryan <mike.ryan@inktank.com>
          Wed, 1 Aug 2012 22:35:38 +0000 (15:35 -0700)
committer Mike Ryan <mike.ryan@inktank.com>
          Thu, 2 Aug 2012 18:14:51 +0000 (11:14 -0700)
Signed-off-by: Mike Ryan <mike.ryan@inktank.com>
teuthology/task/scrub.py [new file with mode: 0644]

diff --git a/teuthology/task/scrub.py b/teuthology/task/scrub.py
new file mode 100644 (file)
index 0000000..c1401de
--- /dev/null
@@ -0,0 +1,108 @@
+import contextlib
+import gevent
+import logging
+import random
+import time
+
+import ceph_manager
+from teuthology import misc as teuthology
+
+log = logging.getLogger(__name__)
+
+@contextlib.contextmanager
+def task(ctx, config):
+    """
+    Run scrub periodically. Randomly chooses an OSD to scrub.
+
+    The config should be as follows:
+
+    scrub:
+        frequency: <seconds between scrubs>
+        deep: <1 for deep scrubs, 0 for regular scrubs>
+
+    example:
+
+    tasks:
+    - ceph:
+    - scrub:
+        frequency: 30
+        deep: 0
+    """
+    if config is None:
+        config = {}
+    assert isinstance(config, dict), \
+        'scrub task only accepts a dict for configuration'
+
+    log.info('Beginning scrub...')
+
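+    # cluster commands are run through the first monitor's remote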
+    first_mon = teuthology.get_first_mon(ctx, config)
+    (mon,) = ctx.cluster.only(first_mon).remotes.iterkeys()
+
+    manager = ceph_manager.CephManager(
+        mon,
+        ctx=ctx,
+        logger=log.getChild('ceph_manager'),
+        )
+
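+    # wait for all OSDs to report up before starting to scrub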
+    num_osds = teuthology.num_instances_of_type(ctx.cluster, 'osd')
+    while len(manager.get_osd_status()['up']) < num_osds:
+        time.sleep(10)
+
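+    # the Scrubber constructor spawns the background scrub loop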
+    scrub_proc = Scrubber(
+        manager,
+        config,
+        )
+    try:
+        yield
+    finally:
+        log.info('joining scrub')
+        scrub_proc.do_join()
+
+class Scrubber:
+    def __init__(self, manager, config):
+        self.ceph_manager = manager
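+        # wait until all placement groups are active+clean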
+        self.ceph_manager.wait_for_clean()
+
+        osd_status = self.ceph_manager.get_osd_status()
+        self.osds = osd_status['up']
+
+        self.config = config
+        if self.config is None:
+            self.config = dict()
+
+        self.stopping = False
+
+        log.info("spawning thread")
+
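+        # run do_scrub concurrently; do_join() collects the greenlet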
+        self.thread = gevent.spawn(self.do_scrub)
+
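+    # signal the scrub loop to stop, then wait for it to finish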
+    def do_join(self):
+        self.stopping = True
+        self.thread.get()
+
+    def do_scrub(self):
+        frequency = self.config.get("frequency", 30)
+        deep = self.config.get("deep", 0)
+
+        log.info("stopping %s" % self.stopping)
+
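+        # each pass scrubs one randomly chosen up OSD, then sleeps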
+        while not self.stopping:
+            osd = str(random.choice(self.osds))
+
+            if deep:
+                cmd = 'deep-scrub'
+            else:
+                cmd = 'scrub'
+
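+            # '%sbing' renders 'scrub'/'deep-scrub' as 'scrubbing'/'deep-scrubbing'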
+            log.info('%sbing %s' % (cmd, osd))
+            self.ceph_manager.raw_cluster_cmd('osd', cmd, osd)
+
+            time.sleep(frequency)
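
Each pass through the loop issues the same command the ceph CLI would. A
minimal sketch of the equivalent calls, assuming `manager` is the
CephManager instance built above and that osd 2 is up (the osd id is
illustrative only):

    # equivalent to `ceph osd scrub 2`: scrub object metadata
    manager.raw_cluster_cmd('osd', 'scrub', '2')
    # equivalent to `ceph osd deep-scrub 2`: also read and verify object data
    manager.raw_cluster_cmd('osd', 'deep-scrub', '2')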