git.apps.os.sepia.ceph.com Git - ceph.git/commitdiff
qa: reorganize mgr unit tests
author Patrick Donnelly <pdonnell@redhat.com>
Tue, 23 Apr 2024 14:39:10 +0000 (10:39 -0400)
committer Patrick Donnelly <pdonnell@redhat.com>
Mon, 29 Apr 2024 16:22:27 +0000 (12:22 -0400)
Refactor common tasks and allow loading mgrmodules before unittests start.

Signed-off-by: Patrick Donnelly <pdonnell@redhat.com>
21 files changed:
qa/suites/rados/mgr/tasks/% [new file with mode: 0644]
qa/suites/rados/mgr/tasks/1-install.yaml [new file with mode: 0644]
qa/suites/rados/mgr/tasks/2-ceph.yaml [new file with mode: 0644]
qa/suites/rados/mgr/tasks/3-mgrmodules.yaml [new file with mode: 0644]
qa/suites/rados/mgr/tasks/4-units/.qa [new symlink]
qa/suites/rados/mgr/tasks/4-units/crash.yaml [new file with mode: 0644]
qa/suites/rados/mgr/tasks/4-units/failover.yaml [new file with mode: 0644]
qa/suites/rados/mgr/tasks/4-units/insights.yaml [new file with mode: 0644]
qa/suites/rados/mgr/tasks/4-units/module_selftest.yaml [new file with mode: 0644]
qa/suites/rados/mgr/tasks/4-units/per_module_finisher_stats.yaml [new file with mode: 0644]
qa/suites/rados/mgr/tasks/4-units/progress.yaml [new file with mode: 0644]
qa/suites/rados/mgr/tasks/4-units/prometheus.yaml [new file with mode: 0644]
qa/suites/rados/mgr/tasks/4-units/workunits.yaml [new file with mode: 0644]
qa/suites/rados/mgr/tasks/crash.yaml [deleted file]
qa/suites/rados/mgr/tasks/failover.yaml [deleted file]
qa/suites/rados/mgr/tasks/insights.yaml [deleted file]
qa/suites/rados/mgr/tasks/module_selftest.yaml [deleted file]
qa/suites/rados/mgr/tasks/per_module_finisher_stats.yaml [deleted file]
qa/suites/rados/mgr/tasks/progress.yaml [deleted file]
qa/suites/rados/mgr/tasks/prometheus.yaml [deleted file]
qa/suites/rados/mgr/tasks/workunits.yaml [deleted file]

diff --git a/qa/suites/rados/mgr/tasks/% b/qa/suites/rados/mgr/tasks/%
new file mode 100644 (file)
index 0000000..e69de29
diff --git a/qa/suites/rados/mgr/tasks/1-install.yaml b/qa/suites/rados/mgr/tasks/1-install.yaml
new file mode 100644 (file)
index 0000000..6c48c52
--- /dev/null
@@ -0,0 +1,2 @@
+tasks:
+  - install:
diff --git a/qa/suites/rados/mgr/tasks/2-ceph.yaml b/qa/suites/rados/mgr/tasks/2-ceph.yaml
new file mode 100644 (file)
index 0000000..7aa9eef
--- /dev/null
@@ -0,0 +1,12 @@
+tasks:
+  - ceph:
+      # tests may leave mgrs broken, so don't try and call into them
+      # to invoke e.g. pg dump during teardown.
+      wait-for-scrub: false
+      log-ignorelist:
+        - overall HEALTH_
+        - \(MGR_DOWN\)
+        - \(PG_
+        - replacing it with standby
+        - No standby daemons available
+        - \(POOL_APP_NOT_ENABLED\)
diff --git a/qa/suites/rados/mgr/tasks/3-mgrmodules.yaml b/qa/suites/rados/mgr/tasks/3-mgrmodules.yaml
new file mode 100644 (file)
index 0000000..c437c60
--- /dev/null
@@ -0,0 +1,8 @@
+mgrmodules:
+  sequential:
+    - print: "Enabling mgr modules"
+    # other fragments append to this
+
+tasks:
+  - sequential:
+      - mgrmodules
diff --git a/qa/suites/rados/mgr/tasks/4-units/.qa b/qa/suites/rados/mgr/tasks/4-units/.qa
new file mode 120000 (symlink)
index 0000000..fea2489
--- /dev/null
@@ -0,0 +1 @@
+../.qa
\ No newline at end of file
diff --git a/qa/suites/rados/mgr/tasks/4-units/crash.yaml b/qa/suites/rados/mgr/tasks/4-units/crash.yaml
new file mode 100644 (file)
index 0000000..5d2ab70
--- /dev/null
@@ -0,0 +1,9 @@
+overrides:
+  ceph:
+    log-ignorelist:
+      - \(RECENT_CRASH\)
+
+tasks:
+  - cephfs_test_runner:
+      modules:
+        - tasks.mgr.test_crash
diff --git a/qa/suites/rados/mgr/tasks/4-units/failover.yaml b/qa/suites/rados/mgr/tasks/4-units/failover.yaml
new file mode 100644 (file)
index 0000000..e54d7a1
--- /dev/null
@@ -0,0 +1,4 @@
+tasks:
+  - cephfs_test_runner:
+      modules:
+        - tasks.mgr.test_failover
diff --git a/qa/suites/rados/mgr/tasks/4-units/insights.yaml b/qa/suites/rados/mgr/tasks/4-units/insights.yaml
new file mode 100644 (file)
index 0000000..bb1252e
--- /dev/null
@@ -0,0 +1,14 @@
+overrides:
+  ceph:
+    # tests may leave mgrs broken, so don't try and call into them
+    # to invoke e.g. pg dump during teardown.
+    wait-for-scrub: false
+    log-ignorelist:
+      - \(MGR_INSIGHTS_WARNING\)
+      - \(insights_health_check
+      - \(RECENT_CRASH\)
+
+tasks:
+  - cephfs_test_runner:
+      modules:
+        - tasks.mgr.test_insights
diff --git a/qa/suites/rados/mgr/tasks/4-units/module_selftest.yaml b/qa/suites/rados/mgr/tasks/4-units/module_selftest.yaml
new file mode 100644 (file)
index 0000000..1eb4a18
--- /dev/null
@@ -0,0 +1,18 @@
+overrides:
+  ceph:
+    log-ignorelist:
+      - Reduced data availability
+      - Degraded data redundancy
+      - objects misplaced
+      - Synthetic exception in serve
+      - influxdb python module not found
+      - \(MGR_ZABBIX_
+      - foo bar
+      - Failed to open Telegraf
+      - evicting unresponsive client
+      - 1 mgr modules have recently crashed \(RECENT_MGR_MODULE_CRASH\)
+tasks:
+  - cephfs_test_runner:
+      modules:
+        - tasks.mgr.test_module_selftest
+      fail_on_skip: false
diff --git a/qa/suites/rados/mgr/tasks/4-units/per_module_finisher_stats.yaml b/qa/suites/rados/mgr/tasks/4-units/per_module_finisher_stats.yaml
new file mode 100644 (file)
index 0000000..e990e62
--- /dev/null
@@ -0,0 +1,41 @@
+overrides:
+  check-counter:
+    counters:
+      mgr:
+          - name: "finisher-balancer.complete_latency.avgcount"
+            min: 1
+          - name: "finisher-balancer.queue_len"
+            expected_val: 0
+          - name: "finisher-crash.complete_latency.avgcount"
+            min: 2
+          - name: "finisher-crash.queue_len"
+            expected_val: 0
+          - name: "finisher-devicehealth.complete_latency.avgcount"
+            min: 1
+          - name: "finisher-devicehealth.queue_len"
+            expected_val: 0
+          - name: "finisher-iostat.complete_latency.avgcount"
+            min: 1
+          - name: "finisher-iostat.queue_len"
+            expected_val: 0
+          - name: "finisher-pg_autoscaler.complete_latency.avgcount"
+            min: 1
+          - name: "finisher-pg_autoscaler.queue_len"
+            expected_val: 0
+          - name: "finisher-progress.complete_latency.avgcount"
+            min: 2
+          - name: "finisher-progress.queue_len"
+            expected_val: 0
+          - name: "finisher-status.complete_latency.avgcount"
+            min: 2
+          - name: "finisher-status.queue_len"
+            expected_val: 0
+          - name: "finisher-telemetry.complete_latency.avgcount"
+            min: 2
+          - name: "finisher-telemetry.queue_len"
+            expected_val: 0
+tasks:
+  - workunit:
+      clients:
+        client.0:
+          - mgr/test_per_module_finisher.sh
diff --git a/qa/suites/rados/mgr/tasks/4-units/progress.yaml b/qa/suites/rados/mgr/tasks/4-units/progress.yaml
new file mode 100644 (file)
index 0000000..6ed4f44
--- /dev/null
@@ -0,0 +1,18 @@
+overrides:
+  ceph:
+    conf:
+      osd:
+        osd mclock profile: high_recovery_ops
+      global:
+        osd pool default size : 3
+        osd pool default min size : 2
+    log-ignorelist:
+      - \(MDS_ALL_DOWN\)
+      - \(MDS_UP_LESS_THAN_MAX\)
+      - \(FS_WITH_FAILED_MDS\)
+      - \(FS_DEGRADED\)
+      - \(OSDMAP_FLAGS\)
+tasks:
+  - cephfs_test_runner:
+      modules:
+        - tasks.mgr.test_progress
diff --git a/qa/suites/rados/mgr/tasks/4-units/prometheus.yaml b/qa/suites/rados/mgr/tasks/4-units/prometheus.yaml
new file mode 100644 (file)
index 0000000..f639e16
--- /dev/null
@@ -0,0 +1,4 @@
+tasks:
+  - cephfs_test_runner:
+      modules:
+        - tasks.mgr.test_prometheus
diff --git a/qa/suites/rados/mgr/tasks/4-units/workunits.yaml b/qa/suites/rados/mgr/tasks/4-units/workunits.yaml
new file mode 100644 (file)
index 0000000..21855b1
--- /dev/null
@@ -0,0 +1,5 @@
+tasks:
+  - workunit:
+      clients:
+        client.0:
+          - mgr/test_localpool.sh
diff --git a/qa/suites/rados/mgr/tasks/crash.yaml b/qa/suites/rados/mgr/tasks/crash.yaml
deleted file mode 100644 (file)
index 9d2ba53..0000000
+++ /dev/null
@@ -1,18 +0,0 @@
-
-tasks:
-  - install:
-  - ceph:
-      # tests may leave mgrs broken, so don't try and call into them
-      # to invoke e.g. pg dump during teardown.
-      wait-for-scrub: false
-      log-ignorelist:
-        - overall HEALTH_
-        - \(MGR_DOWN\)
-        - \(PG_
-        - \(RECENT_CRASH\)
-        - replacing it with standby
-        - No standby daemons available
-        - \(POOL_APP_NOT_ENABLED\)
-  - cephfs_test_runner:
-      modules:
-        - tasks.mgr.test_crash
diff --git a/qa/suites/rados/mgr/tasks/failover.yaml b/qa/suites/rados/mgr/tasks/failover.yaml
deleted file mode 100644 (file)
index 6d1e0d5..0000000
+++ /dev/null
@@ -1,17 +0,0 @@
-
-tasks:
-  - install:
-  - ceph:
-      # tests may leave mgrs broken, so don't try and call into them
-      # to invoke e.g. pg dump during teardown.
-      wait-for-scrub: false
-      log-ignorelist:
-        - overall HEALTH_
-        - \(MGR_DOWN\)
-        - \(PG_
-        - replacing it with standby
-        - No standby daemons available
-        - \(POOL_APP_NOT_ENABLED\)
-  - cephfs_test_runner:
-      modules:
-        - tasks.mgr.test_failover
diff --git a/qa/suites/rados/mgr/tasks/insights.yaml b/qa/suites/rados/mgr/tasks/insights.yaml
deleted file mode 100644 (file)
index f7c82cf..0000000
+++ /dev/null
@@ -1,20 +0,0 @@
-
-tasks:
-  - install:
-  - ceph:
-      # tests may leave mgrs broken, so don't try and call into them
-      # to invoke e.g. pg dump during teardown.
-      wait-for-scrub: false
-      log-ignorelist:
-        - overall HEALTH_
-        - \(MGR_DOWN\)
-        - \(MGR_INSIGHTS_WARNING\)
-        - \(insights_health_check
-        - \(PG_
-        - \(RECENT_CRASH\)
-        - replacing it with standby
-        - No standby daemons available
-        - \(POOL_APP_NOT_ENABLED\)
-  - cephfs_test_runner:
-      modules:
-        - tasks.mgr.test_insights
diff --git a/qa/suites/rados/mgr/tasks/module_selftest.yaml b/qa/suites/rados/mgr/tasks/module_selftest.yaml
deleted file mode 100644 (file)
index 4403d9f..0000000
+++ /dev/null
@@ -1,28 +0,0 @@
-
-tasks:
-  - install:
-  - ceph:
-      # tests may leave mgrs broken, so don't try and call into them
-      # to invoke e.g. pg dump during teardown.
-      wait-for-scrub: false
-      log-ignorelist:
-        - overall HEALTH_
-        - \(MGR_DOWN\)
-        - \(PG_
-        - replacing it with standby
-        - No standby daemons available
-        - Reduced data availability
-        - Degraded data redundancy
-        - objects misplaced
-        - Synthetic exception in serve
-        - influxdb python module not found
-        - \(MGR_ZABBIX_
-        - foo bar
-        - Failed to open Telegraf
-        - evicting unresponsive client
-        - 1 mgr modules have recently crashed \(RECENT_MGR_MODULE_CRASH\)
-        - \(POOL_APP_NOT_ENABLED\)
-  - cephfs_test_runner:
-      modules:
-        - tasks.mgr.test_module_selftest
-      fail_on_skip: false
diff --git a/qa/suites/rados/mgr/tasks/per_module_finisher_stats.yaml b/qa/suites/rados/mgr/tasks/per_module_finisher_stats.yaml
deleted file mode 100644 (file)
index de1d592..0000000
+++ /dev/null
@@ -1,45 +0,0 @@
-tasks:
-  - install:
-  - ceph:
-      wait-for-scrub: false
-      log-ignorelist:
-        - \(POOL_APP_NOT_ENABLED\)
-  - check-counter:
-      counters:
-        mgr:
-            - name: "finisher-balancer.complete_latency.avgcount"
-              min: 1
-            - name: "finisher-balancer.queue_len"
-              expected_val: 0
-            - name: "finisher-crash.complete_latency.avgcount"
-              min: 2
-            - name: "finisher-crash.queue_len"
-              expected_val: 0
-            - name: "finisher-devicehealth.complete_latency.avgcount"
-              min: 1
-            - name: "finisher-devicehealth.queue_len"
-              expected_val: 0
-            - name: "finisher-iostat.complete_latency.avgcount"
-              min: 1
-            - name: "finisher-iostat.queue_len"
-              expected_val: 0
-            - name: "finisher-pg_autoscaler.complete_latency.avgcount"
-              min: 1
-            - name: "finisher-pg_autoscaler.queue_len"
-              expected_val: 0
-            - name: "finisher-progress.complete_latency.avgcount"
-              min: 2
-            - name: "finisher-progress.queue_len"
-              expected_val: 0
-            - name: "finisher-status.complete_latency.avgcount"
-              min: 2
-            - name: "finisher-status.queue_len"
-              expected_val: 0
-            - name: "finisher-telemetry.complete_latency.avgcount"
-              min: 2
-            - name: "finisher-telemetry.queue_len"
-              expected_val: 0
-  - workunit:
-      clients:
-        client.0:
-          - mgr/test_per_module_finisher.sh
diff --git a/qa/suites/rados/mgr/tasks/progress.yaml b/qa/suites/rados/mgr/tasks/progress.yaml
deleted file mode 100644 (file)
index 183a9a2..0000000
+++ /dev/null
@@ -1,30 +0,0 @@
-overrides:
-  ceph:
-    conf:
-      osd:
-        osd mclock profile: high_recovery_ops
-tasks:
-  - install:
-  - ceph:
-      config:
-        global:
-          osd pool default size : 3
-          osd pool default min size : 2
-      # tests may leave mgrs broken, so don't try and call into them
-      # to invoke e.g. pg dump during teardown.
-      wait-for-scrub: false
-      log-ignorelist:
-        - overall HEALTH_
-        - \(MGR_DOWN\)
-        - \(MDS_ALL_DOWN\)
-        - \(MDS_UP_LESS_THAN_MAX\)
-        - \(FS_WITH_FAILED_MDS\)
-        - \(FS_DEGRADED\)
-        - \(PG_
-        - \(OSDMAP_FLAGS\)
-        - replacing it with standby
-        - No standby daemons available
-        - \(POOL_APP_NOT_ENABLED\)
-  - cephfs_test_runner:
-      modules:
-        - tasks.mgr.test_progress
diff --git a/qa/suites/rados/mgr/tasks/prometheus.yaml b/qa/suites/rados/mgr/tasks/prometheus.yaml
deleted file mode 100644 (file)
index fd0e23a..0000000
+++ /dev/null
@@ -1,17 +0,0 @@
-
-tasks:
-  - install:
-  - ceph:
-      # tests may leave mgrs broken, so don't try and call into them
-      # to invoke e.g. pg dump during teardown.
-      wait-for-scrub: false
-      log-ignorelist:
-        - overall HEALTH_
-        - \(MGR_DOWN\)
-        - \(PG_
-        - replacing it with standby
-        - No standby daemons available
-        - \(POOL_APP_NOT_ENABLED\)
-  - cephfs_test_runner:
-      modules:
-        - tasks.mgr.test_prometheus
diff --git a/qa/suites/rados/mgr/tasks/workunits.yaml b/qa/suites/rados/mgr/tasks/workunits.yaml
deleted file mode 100644 (file)
index a482740..0000000
+++ /dev/null
@@ -1,17 +0,0 @@
-tasks:
-  - install:
-  - ceph:
-      # tests may leave mgrs broken, so don't try and call into them
-      # to invoke e.g. pg dump during teardown.
-      wait-for-scrub: false
-      log-ignorelist:
-        - overall HEALTH_
-        - \(MGR_DOWN\)
-        - \(PG_
-        - replacing it with standby
-        - No standby daemons available
-        - \(POOL_APP_NOT_ENABLED\)
-  - workunit:
-      clients:
-        client.0:
-          - mgr/test_localpool.sh