git.apps.os.sepia.ceph.com Git - ceph.git/commitdiff
qa/suites/rados/thrash-old-clients: do some thrashing with jewel and luminous clients 21679/head
author: Sage Weil <sage@redhat.com>
Tue, 24 Apr 2018 17:08:07 +0000 (12:08 -0500)
committer: Sage Weil <sage@redhat.com>
Tue, 24 Apr 2018 21:14:36 +0000 (16:14 -0500)
Signed-off-by: Sage Weil <sage@redhat.com>
29 files changed:
qa/suites/rados/thrash-old-clients/% [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/0-size-min-size-overrides/2-size-2-min-size.yaml [new symlink]
qa/suites/rados/thrash-old-clients/0-size-min-size-overrides/3-size-2-min-size.yaml [new symlink]
qa/suites/rados/thrash-old-clients/1-install/jewel.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/1-install/luminous.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/backoff/normal.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/backoff/peering.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/backoff/peering_and_degraded.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/ceph.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/clusters/+ [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/clusters/openstack.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/clusters/two-plus-three.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/d-balancer/crush-compat.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/d-balancer/off.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/msgr [new symlink]
qa/suites/rados/thrash-old-clients/msgr-failures/fastclose.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/msgr-failures/few.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/msgr-failures/osd-delay.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/rados.yaml [new symlink]
qa/suites/rados/thrash-old-clients/rocksdb.yaml [new symlink]
qa/suites/rados/thrash-old-clients/thrashers/default.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/thrashers/mapgap.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/thrashers/morepggrow.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/thrashers/none.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/thrashers/pggrow.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/thrashosds-health.yaml [new symlink]
qa/suites/rados/thrash-old-clients/workloads/cache-snaps.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/workloads/radosbench.yaml [new file with mode: 0644]
qa/suites/rados/thrash-old-clients/workloads/snaps-few-objects.yaml [new file with mode: 0644]

diff --git a/qa/suites/rados/thrash-old-clients/% b/qa/suites/rados/thrash-old-clients/%
new file mode 100644 (file)
index 0000000..e69de29
diff --git a/qa/suites/rados/thrash-old-clients/0-size-min-size-overrides/2-size-2-min-size.yaml b/qa/suites/rados/thrash-old-clients/0-size-min-size-overrides/2-size-2-min-size.yaml
new file mode 120000 (symlink)
index 0000000..c429b07
--- /dev/null
@@ -0,0 +1 @@
+../../../../overrides/2-size-2-min-size.yaml
\ No newline at end of file
diff --git a/qa/suites/rados/thrash-old-clients/0-size-min-size-overrides/3-size-2-min-size.yaml b/qa/suites/rados/thrash-old-clients/0-size-min-size-overrides/3-size-2-min-size.yaml
new file mode 120000 (symlink)
index 0000000..8d529f0
--- /dev/null
@@ -0,0 +1 @@
+../../../../overrides/3-size-2-min-size.yaml
\ No newline at end of file
diff --git a/qa/suites/rados/thrash-old-clients/1-install/jewel.yaml b/qa/suites/rados/thrash-old-clients/1-install/jewel.yaml
new file mode 100644 (file)
index 0000000..b68ee3d
--- /dev/null
@@ -0,0 +1,7 @@
+tasks:
+- install:
+    branch: jewel
+    exclude_packages: ['ceph-mgr','libcephfs2','libcephfs-devel','libcephfs-dev']
+- install.upgrade:
+    mon.a:
+    mon.b:
diff --git a/qa/suites/rados/thrash-old-clients/1-install/luminous.yaml b/qa/suites/rados/thrash-old-clients/1-install/luminous.yaml
new file mode 100644 (file)
index 0000000..1961c89
--- /dev/null
@@ -0,0 +1,6 @@
+tasks:
+- install:
+    branch: luminous
+- install.upgrade:
+    mon.a:
+    mon.b:
diff --git a/qa/suites/rados/thrash-old-clients/backoff/normal.yaml b/qa/suites/rados/thrash-old-clients/backoff/normal.yaml
new file mode 100644 (file)
index 0000000..e69de29
diff --git a/qa/suites/rados/thrash-old-clients/backoff/peering.yaml b/qa/suites/rados/thrash-old-clients/backoff/peering.yaml
new file mode 100644 (file)
index 0000000..66d0611
--- /dev/null
@@ -0,0 +1,5 @@
+overrides:
+  ceph:
+    conf:
+      osd:
+        osd backoff on peering: true
diff --git a/qa/suites/rados/thrash-old-clients/backoff/peering_and_degraded.yaml b/qa/suites/rados/thrash-old-clients/backoff/peering_and_degraded.yaml
new file mode 100644 (file)
index 0000000..e610990
--- /dev/null
@@ -0,0 +1,6 @@
+overrides:
+  ceph:
+    conf:
+      osd:
+        osd backoff on peering: true
+        osd backoff on degraded: true
diff --git a/qa/suites/rados/thrash-old-clients/ceph.yaml b/qa/suites/rados/thrash-old-clients/ceph.yaml
new file mode 100644 (file)
index 0000000..5df450d
--- /dev/null
@@ -0,0 +1,2 @@
+tasks:
+- ceph:
diff --git a/qa/suites/rados/thrash-old-clients/clusters/+ b/qa/suites/rados/thrash-old-clients/clusters/+
new file mode 100644 (file)
index 0000000..e69de29
diff --git a/qa/suites/rados/thrash-old-clients/clusters/openstack.yaml b/qa/suites/rados/thrash-old-clients/clusters/openstack.yaml
new file mode 100644 (file)
index 0000000..b0f3b9b
--- /dev/null
@@ -0,0 +1,4 @@
+openstack:
+  - volumes: # attached to each instance
+      count: 4
+      size: 30 # GB
diff --git a/qa/suites/rados/thrash-old-clients/clusters/two-plus-three.yaml b/qa/suites/rados/thrash-old-clients/clusters/two-plus-three.yaml
new file mode 100644 (file)
index 0000000..fc86b98
--- /dev/null
@@ -0,0 +1,13 @@
+roles:
+- [mon.a, mon.c, mgr.y, osd.0, osd.1, osd.2, osd.3, client.0]
+- [mon.b, mgr.x, osd.4, osd.5, osd.6, osd.7, client.1]
+- [client.2]
+openstack:
+- volumes: # attached to each instance
+    count: 4
+    size: 10 # GB
+overrides:
+  ceph:
+    conf:
+      osd:
+        osd shutdown pgref assert: true
diff --git a/qa/suites/rados/thrash-old-clients/d-balancer/crush-compat.yaml b/qa/suites/rados/thrash-old-clients/d-balancer/crush-compat.yaml
new file mode 100644 (file)
index 0000000..aa86766
--- /dev/null
@@ -0,0 +1,6 @@
+tasks:
+- exec:
+    mon.a:
+      - while ! ceph balancer status ; do sleep 1 ; done
+      - ceph balancer mode crush-compat
+      - ceph balancer on
diff --git a/qa/suites/rados/thrash-old-clients/d-balancer/off.yaml b/qa/suites/rados/thrash-old-clients/d-balancer/off.yaml
new file mode 100644 (file)
index 0000000..e69de29
diff --git a/qa/suites/rados/thrash-old-clients/msgr b/qa/suites/rados/thrash-old-clients/msgr
new file mode 120000 (symlink)
index 0000000..b29ecdd
--- /dev/null
@@ -0,0 +1 @@
+../basic/msgr
\ No newline at end of file
diff --git a/qa/suites/rados/thrash-old-clients/msgr-failures/fastclose.yaml b/qa/suites/rados/thrash-old-clients/msgr-failures/fastclose.yaml
new file mode 100644 (file)
index 0000000..77fd730
--- /dev/null
@@ -0,0 +1,6 @@
+overrides:
+  ceph:
+    conf:
+      global:
+        ms inject socket failures: 2500
+        ms tcp read timeout: 5
diff --git a/qa/suites/rados/thrash-old-clients/msgr-failures/few.yaml b/qa/suites/rados/thrash-old-clients/msgr-failures/few.yaml
new file mode 100644 (file)
index 0000000..477bffe
--- /dev/null
@@ -0,0 +1,7 @@
+overrides:
+  ceph:
+    conf:
+      global:
+        ms inject socket failures: 5000
+      osd:
+        osd heartbeat use min delay socket: true
diff --git a/qa/suites/rados/thrash-old-clients/msgr-failures/osd-delay.yaml b/qa/suites/rados/thrash-old-clients/msgr-failures/osd-delay.yaml
new file mode 100644 (file)
index 0000000..a33ba89
--- /dev/null
@@ -0,0 +1,9 @@
+overrides:
+  ceph:
+    conf:
+      global:
+        ms inject socket failures: 2500
+        ms inject delay type: osd
+        ms inject delay probability: .005
+        ms inject delay max: 1
+        ms inject internal delays: .002
diff --git a/qa/suites/rados/thrash-old-clients/rados.yaml b/qa/suites/rados/thrash-old-clients/rados.yaml
new file mode 120000 (symlink)
index 0000000..b756e57
--- /dev/null
@@ -0,0 +1 @@
+../../../config/rados.yaml
\ No newline at end of file
diff --git a/qa/suites/rados/thrash-old-clients/rocksdb.yaml b/qa/suites/rados/thrash-old-clients/rocksdb.yaml
new file mode 120000 (symlink)
index 0000000..f26e095
--- /dev/null
@@ -0,0 +1 @@
+../../../mon_kv_backend/rocksdb.yaml
\ No newline at end of file
diff --git a/qa/suites/rados/thrash-old-clients/thrashers/default.yaml b/qa/suites/rados/thrash-old-clients/thrashers/default.yaml
new file mode 100644 (file)
index 0000000..e8e2007
--- /dev/null
@@ -0,0 +1,24 @@
+overrides:
+  ceph:
+    log-whitelist:
+    - but it is still running
+    - objects unfound and apparently lost
+    conf:
+      osd:
+        osd debug reject backfill probability: .3
+        osd scrub min interval: 60
+        osd scrub max interval: 120
+        osd max backfills: 3
+        osd snap trim sleep: 2
+      mon:
+        mon min osdmap epochs: 50
+        paxos service trim min: 10
+        # prune full osdmaps regularly
+        mon osdmap full prune min: 15
+        mon osdmap full prune interval: 2
+        mon osdmap full prune txsize: 2
+tasks:
+- thrashosds:
+    timeout: 1200
+    chance_pgnum_grow: 1
+    chance_pgpnum_fix: 1
diff --git a/qa/suites/rados/thrash-old-clients/thrashers/mapgap.yaml b/qa/suites/rados/thrash-old-clients/thrashers/mapgap.yaml
new file mode 100644 (file)
index 0000000..7b55097
--- /dev/null
@@ -0,0 +1,26 @@
+overrides:
+  ceph:
+    log-whitelist:
+    - but it is still running
+    - objects unfound and apparently lost
+    - osd_map_cache_size
+    conf:
+      mon:
+        mon min osdmap epochs: 50
+        paxos service trim min: 10
+        # prune full osdmaps regularly
+        mon osdmap full prune min: 15
+        mon osdmap full prune interval: 2
+        mon osdmap full prune txsize: 2
+      osd:
+        osd map cache size: 1
+        osd scrub min interval: 60
+        osd scrub max interval: 120
+        osd scrub during recovery: false
+        osd max backfills: 6
+tasks:
+- thrashosds:
+    timeout: 1800
+    chance_pgnum_grow: 0.25
+    chance_pgpnum_fix: 0.25
+    chance_test_map_discontinuity: 2
diff --git a/qa/suites/rados/thrash-old-clients/thrashers/morepggrow.yaml b/qa/suites/rados/thrash-old-clients/thrashers/morepggrow.yaml
new file mode 100644 (file)
index 0000000..91d2173
--- /dev/null
@@ -0,0 +1,22 @@
+overrides:
+  ceph:
+    conf:
+      osd:
+        osd scrub min interval: 60
+        osd scrub max interval: 120
+        journal throttle high multiple: 2
+        journal throttle max multiple: 10
+        filestore queue throttle high multiple: 2
+        filestore queue throttle max multiple: 10
+        osd max backfills: 9
+    log-whitelist:
+    - but it is still running
+    - objects unfound and apparently lost
+tasks:
+- thrashosds:
+    timeout: 1200
+    chance_pgnum_grow: 3
+    chance_pgpnum_fix: 1
+openstack:
+- volumes:
+    size: 50
diff --git a/qa/suites/rados/thrash-old-clients/thrashers/none.yaml b/qa/suites/rados/thrash-old-clients/thrashers/none.yaml
new file mode 100644 (file)
index 0000000..e69de29
diff --git a/qa/suites/rados/thrash-old-clients/thrashers/pggrow.yaml b/qa/suites/rados/thrash-old-clients/thrashers/pggrow.yaml
new file mode 100644 (file)
index 0000000..8721fd1
--- /dev/null
@@ -0,0 +1,24 @@
+overrides:
+  ceph:
+    log-whitelist:
+    - but it is still running
+    - objects unfound and apparently lost
+    conf:
+      osd:
+        osd scrub min interval: 60
+        osd scrub max interval: 120
+        filestore odsync write: true
+        osd max backfills: 2
+        osd snap trim sleep: .5
+      mon:
+        mon min osdmap epochs: 50
+        paxos service trim min: 10
+        # prune full osdmaps regularly
+        mon osdmap full prune min: 15
+        mon osdmap full prune interval: 2
+        mon osdmap full prune txsize: 2
+tasks:
+- thrashosds:
+    timeout: 1200
+    chance_pgnum_grow: 2
+    chance_pgpnum_fix: 1
diff --git a/qa/suites/rados/thrash-old-clients/thrashosds-health.yaml b/qa/suites/rados/thrash-old-clients/thrashosds-health.yaml
new file mode 120000 (symlink)
index 0000000..ebf7f34
--- /dev/null
@@ -0,0 +1 @@
+../../../tasks/thrashosds-health.yaml
\ No newline at end of file
diff --git a/qa/suites/rados/thrash-old-clients/workloads/cache-snaps.yaml b/qa/suites/rados/thrash-old-clients/workloads/cache-snaps.yaml
new file mode 100644 (file)
index 0000000..fc1f5b4
--- /dev/null
@@ -0,0 +1,34 @@
+overrides:
+  ceph:
+    log-whitelist:
+      - must scrub before tier agent can activate
+tasks:
+- exec:
+    client.0:
+      - sudo ceph osd pool create base 4
+      - sudo ceph osd pool application enable base rados
+      - sudo ceph osd pool create cache 4
+      - sudo ceph osd tier add base cache
+      - sudo ceph osd tier cache-mode cache writeback
+      - sudo ceph osd tier set-overlay base cache
+      - sudo ceph osd pool set cache hit_set_type bloom
+      - sudo ceph osd pool set cache hit_set_count 8
+      - sudo ceph osd pool set cache hit_set_period 3600
+      - sudo ceph osd pool set cache target_max_objects 250
+      - sudo ceph osd pool set cache min_read_recency_for_promote 2
+- rados:
+    clients: [client.2]
+    pools: [base]
+    ops: 4000
+    objects: 500
+    op_weights:
+      read: 100
+      write: 100
+      delete: 50
+      copy_from: 50
+      cache_flush: 50
+      cache_try_flush: 50
+      cache_evict: 50
+      snap_create: 50
+      snap_remove: 50
+      rollback: 50
diff --git a/qa/suites/rados/thrash-old-clients/workloads/radosbench.yaml b/qa/suites/rados/thrash-old-clients/workloads/radosbench.yaml
new file mode 100644 (file)
index 0000000..6a89a4e
--- /dev/null
@@ -0,0 +1,33 @@
+overrides:
+  ceph:
+    conf:
+      client.2:
+        debug ms: 1
+        debug objecter: 20
+        debug rados: 20
+tasks:
+- full_sequential:
+  - radosbench:
+      clients: [client.2]
+      time: 90
+  - radosbench:
+      clients: [client.2]
+      time: 90
+  - radosbench:
+      clients: [client.2]
+      time: 90
+  - radosbench:
+      clients: [client.2]
+      time: 90
+  - radosbench:
+      clients: [client.2]
+      time: 90
+  - radosbench:
+      clients: [client.2]
+      time: 90
+  - radosbench:
+      clients: [client.2]
+      time: 90
+  - radosbench:
+      clients: [client.2]
+      time: 90
diff --git a/qa/suites/rados/thrash-old-clients/workloads/snaps-few-objects.yaml b/qa/suites/rados/thrash-old-clients/workloads/snaps-few-objects.yaml
new file mode 100644 (file)
index 0000000..f0a5735
--- /dev/null
@@ -0,0 +1,13 @@
+tasks:
+- rados:
+    clients: [client.2]
+    ops: 4000
+    objects: 50
+    op_weights:
+      read: 100
+      write: 100
+      delete: 50
+      snap_create: 50
+      snap_remove: 50
+      rollback: 50
+      copy_from: 50