qa/standalone/scrub: Force a subset of scrub tests to use "wpq" scheduler

author Sridhar Seshasayee <sseshasa@redhat.com>

Mon, 21 Jun 2021 12:47:32 +0000 (18:17 +0530)

committer Sridhar Seshasayee <sseshasa@redhat.com>

Fri, 30 Jul 2021 12:46:00 +0000 (18:16 +0530)
author Sridhar Seshasayee <sseshasa@redhat.com>
Mon, 21 Jun 2021 12:47:32 +0000 (18:17 +0530)
committer Sridhar Seshasayee <sseshasa@redhat.com>
Fri, 30 Jul 2021 12:46:00 +0000 (18:16 +0530)
diff --git a/qa/standalone/scrub/osd-scrub-dump.sh b/qa/standalone/scrub/osd-scrub-dump.sh

index 6d18d6a60f3e28580c709d40fb65e5714af61da5..092e4ef6eadc4d6f53c624ec3bd68d49525090fe 100755 (executable)
--- a/qa/standalone/scrub/osd-scrub-dump.sh
+++ b/qa/standalone/scrub/osd-scrub-dump.sh
@@ -24,7 +24,6 @@ POOL_SIZE=3
  function run() {
      local dir=$1
      shift
-    local SLEEP=0
      local CHUNK_MAX=5
  
      export CEPH_MON="127.0.0.1:7184" # git grep '\<7184\>' : there must be only one
@@ -32,10 +31,13 @@ function run() {
      CEPH_ARGS+="--fsid=$(uuidgen) --auth-supported=none "
      CEPH_ARGS+="--mon-host=$CEPH_MON "
      CEPH_ARGS+="--osd_max_scrubs=$MAX_SCRUBS "
-    CEPH_ARGS+="--osd_scrub_sleep=$SLEEP "
      CEPH_ARGS+="--osd_scrub_chunk_max=$CHUNK_MAX "
      CEPH_ARGS+="--osd_scrub_sleep=$SCRUB_SLEEP "
      CEPH_ARGS+="--osd_pool_default_size=$POOL_SIZE "
+    # Set scheduler to "wpq" until there's a reliable way to query scrub states
+    # with "--osd-scrub-sleep" set to 0. The "mclock_scheduler" overrides the
+    # scrub sleep to 0 and as a result the checks in the test fail.
+    CEPH_ARGS+="--osd_op_queue=wpq "
  
      export -n CEPH_CLI_TEST_DUP_COMMAND
      local funcs=${@:-$(set | sed -n -e 's/^\(TEST_[0-9a-z_]*\) .*/\1/p')}
@@ -91,10 +93,9 @@ function TEST_recover_unexpected() {
      ceph pg dump pgs
  
      max=$(CEPH_ARGS='' ceph daemon $(get_asok_path osd.0) dump_scrub_reservations | jq '.osd_max_scrubs')
-    if [ $max != $MAX_SCRUBS];
-    then
-       echo "ERROR: Incorrect osd_max_scrubs from dump_scrub_reservations"
-       return 1
+    if [ $max != $MAX_SCRUBS ]; then
+        echo "ERROR: Incorrect osd_max_scrubs from dump_scrub_reservations"
+        return 1
      fi
  
      ceph osd unset noscrub
diff --git a/qa/standalone/scrub/osd-scrub-repair.sh b/qa/standalone/scrub/osd-scrub-repair.sh

index 3e56a2f9b1471cdeb912d9a9e86bd3709e6d1858..625d976a7cf7ad1e85113a36aeed15e50780fe8d 100755 (executable)
--- a/qa/standalone/scrub/osd-scrub-repair.sh
+++ b/qa/standalone/scrub/osd-scrub-repair.sh
@@ -390,9 +390,13 @@ function TEST_auto_repair_bluestore_tag() {
      # Launch a cluster with 3 seconds scrub interval
      run_mon $dir a || return 1
      run_mgr $dir x || return 1
+    # Set scheduler to "wpq" until there's a reliable way to query scrub states
+    # with "--osd-scrub-sleep" set to 0. The "mclock_scheduler" overrides the
+    # scrub sleep to 0 and as a result the checks in the test fail.
      local ceph_osd_args="--osd-scrub-auto-repair=true \
              --osd_deep_scrub_randomize_ratio=0 \
-            --osd-scrub-interval-randomize-ratio=0"
+            --osd-scrub-interval-randomize-ratio=0 \
+            --osd-op-queue=wpq"
      for id in $(seq 0 2) ; do
          run_osd $dir $id $ceph_osd_args || return 1
      done
diff --git a/qa/standalone/scrub/osd-scrub-test.sh b/qa/standalone/scrub/osd-scrub-test.sh

index 5dd029c356fe196f6b22f3223d555742bb626c4f..6cea0b8fcf8321b4582e790618d981f186243cff 100755 (executable)
--- a/qa/standalone/scrub/osd-scrub-test.sh
+++ b/qa/standalone/scrub/osd-scrub-test.sh
@@ -301,10 +301,15 @@ function _scrub_abort() {
      run_mgr $dir x || return 1
      for osd in $(seq 0 $(expr $OSDS - 1))
      do
-      run_osd $dir $osd --osd_pool_default_pg_autoscale_mode=off \
-             --osd_deep_scrub_randomize_ratio=0.0 \
-             --osd_scrub_sleep=5.0 \
-             --osd_scrub_interval_randomize_ratio=0  || return 1
+        # Set scheduler to "wpq" until there's a reliable way to query scrub
+        # states with "--osd-scrub-sleep" set to 0. The "mclock_scheduler"
+        # overrides the scrub sleep to 0 and as a result the checks in the
+        # test fail.
+        run_osd $dir $osd --osd_pool_default_pg_autoscale_mode=off \
+            --osd_deep_scrub_randomize_ratio=0.0 \
+            --osd_scrub_sleep=5.0 \
+            --osd_scrub_interval_randomize_ratio=0 \
+            --osd_op_queue=wpq || return 1
      done
  
      # Create a pool with a single pg
author	Sridhar Seshasayee <sseshasa@redhat.com>
	Mon, 21 Jun 2021 12:47:32 +0000 (18:17 +0530)
committer	Sridhar Seshasayee <sseshasa@redhat.com>
	Fri, 30 Jul 2021 12:46:00 +0000 (18:16 +0530)
qa/standalone/scrub/osd-scrub-dump.sh		patch | blob | history
qa/standalone/scrub/osd-scrub-repair.sh		patch | blob | history
qa/standalone/scrub/osd-scrub-test.sh		patch | blob | history