- 'attr name mistmatch'
- 'deep-scrub 1 missing, 0 inconsistent objects'
- 'failed to pick suitable auth object'
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
+ - HEALTH_ERR PG_
+ - HEALTH_ERR OSD_SCRUB_ERRORS
+ - HEALTH_WARN TOO_FEW_PGS
conf:
osd:
osd deep scrub update digest min age: 0
+overrides:
+ ceph:
+ log-whitelist:
+ - HEALTH_WARN OSD_CACHE_NO_HIT_SET
+ - HEALTH_WARN TOO_FEW_PGS
tasks:
- workunit:
clients:
- 'size 1 != size'
- attr name mismatch
- Regular scrub request, losing deep-scrub details
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
conf:
osd:
filestore debug inject read err: true
- ceph:
# tests may leave mgrs broken, so don't try and call into them
# to invoke e.g. pg dump during teardown.
- wait-for-scrub: false
+ wait-for-scrub: false
+ log-whitelist:
+ - HEALTH_WARN MGR_DOWN
+ - HEALTH_ERR MGR_DOWN
- cephfs_test_runner:
modules:
- tasks.mgr.test_failover
+overrides:
+ ceph:
+ log-whitelist:
+ - HEALTH_WARN MON_DOWN
+ - HEALTH_WARN TOO_FEW_PGS
tasks:
- mon_thrash:
revive_delay: 90
overrides:
ceph:
+ log-whitelist:
+ - HEALTH_WARN MON_DOWN
conf:
osd:
mon client ping interval: 4
+overrides:
+ ceph:
+ log-whitelist:
+ - HEALTH_WARN MON_DOWN
tasks:
- mon_thrash:
revive_delay: 20
overrides:
ceph:
+ log-whitelist:
+ - HEALTH_WARN MON_DOWN
conf:
mon:
paxos min: 10
overrides:
ceph:
+ log-whitelist:
+ - HEALTH_WARN MON_DOWN
conf:
mon:
paxos min: 10
- slow request
- .*clock.*skew.*
- clocks not synchronized
+ - HEALTH_WARN MON_CLOCK_SKEW
- mon_clock_skew_check:
expect-skew: false
- slow request
- .*clock.*skew.*
- clocks not synchronized
+ - HEALTH_WARN MON_CLOCK_SKEW
- mon_clock_skew_check:
expect-skew: true
global:
osd max object name len: 460
osd max object namespace len: 64
+ log-whitelist:
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
+ - HEALTH_ERR PG_
+ - HEALTH_WARN TOO_FEW_PGS
- ceph_objectstore_tool:
objects: 20
- must scrub before tier agent can activate
- failsafe engaged, dropping updates
- failsafe disengaged, no longer dropping updates
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
+ - HEALTH_ERR PG_
+ - HEALTH_WARN SMALLER_PGP_NUM
- workunit:
clients:
all:
log-whitelist:
- MDS in read-only mode
- force file system read-only
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_ERR OSD_FULL
+ - HEALTH_WARN MDS_READ_ONLY
tasks:
- install:
- ceph:
tasks:
- install:
- ceph:
+ log-whitelist:
+ - HEALTH_WARN OSD_CACHE_NO_HIT_SET
conf:
global:
osd max object name len: 460
ceph:
log-whitelist:
- is full
+ - HEALTH_ERR POOL_FULL
+ - HEALTH_WARN POOL_NEAR_FULL
tasks:
- install:
- ceph:
osd max object namespace len: 64
log-whitelist:
- wrongly marked me down
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
- workunit:
clients:
all:
overrides:
ceph:
+ log-whitelist:
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
+ - HEALTH_WARN DEGRADED_OBJECTS
conf:
osd:
debug osd: 5
overrides:
ceph:
+ log-whitelist:
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
+ - HEALTH_WARN DEGRADED_OBJECTS
conf:
osd:
debug osd: 5
- install:
- ceph:
log-whitelist:
- - wrongly marked me down
+ - wrongly marked me down
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
- dump_stuck:
- install:
- ceph:
log-whitelist:
- - objects unfound and apparently lost
+ - objects unfound and apparently lost
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
+ - HEALTH_WARN UNFOUND_OBJECTS
+ - HEALTH_WARN DEGRADED_OBJECTS
- ec_lost_unfound:
- install:
- ceph:
log-whitelist:
- - objects unfound and apparently lost
+ - objects unfound and apparently lost
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
+ - HEALTH_ERR PG_
+ - HEALTH_WARN UNFOUND_OBJECTS
+ - HEALTH_WARN MISPLACED_OBJECTS
+ - HEALTH_WARN DEGRADED_OBJECTS
- rep_lost_unfound_delete:
- install:
- ceph:
log-whitelist:
- - objects unfound and apparently lost
+ - objects unfound and apparently lost
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
+ - HEALTH_ERR PG_
+ - HEALTH_WARN UNFOUND_OBJECTS
+ - HEALTH_WARN MISPLACED_OBJECTS
+ - HEALTH_WARN DEGRADED_OBJECTS
- lost_unfound:
- install:
- ceph:
log-whitelist:
- - wrongly marked me down
+ - wrongly marked me down
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
conf:
osd:
osd min pg log entries: 5
- install:
- ceph:
log-whitelist:
- - wrongly marked me down
+ - wrongly marked me down
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
conf:
osd:
osd min pg log entries: 5
- install:
- ceph:
log-whitelist:
- - wrongly marked me down
+ - wrongly marked me down
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
conf:
osd:
osd min pg log entries: 5
global:
osd pool default min size : 1
log-whitelist:
- - objects unfound and apparently lost
+ - objects unfound and apparently lost
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
- peer:
- install:
- ceph:
log-whitelist:
- - wrongly marked me down
- - slow request
+ - wrongly marked me down
+ - slow request
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
- exec:
client.0:
- sudo ceph osd pool create foo 128 128
- install:
- ceph:
log-whitelist:
- - no reply from
+ - no reply from
+ - HEALTH_WARN MON_DOWN
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN PG_
- full_sequential:
- radosbench:
clients: [client.0]
+++ /dev/null
-roles:
-- - mon.a
- - mgr.x
- - osd.0
- - osd.1
- - osd.2
-- - osd.3
- - osd.4
- - osd.5
- - client.0
-openstack:
- - volumes: # attached to each instance
- count: 3
- size: 10 # GB
-tasks:
-- install:
-- ceph:
- log-whitelist:
- - wrongly marked me down
-- thrashosds:
- op_delay: 30
- clean_interval: 120
- chance_down: .5
-- workunit:
- clients:
- all:
- - rados/load-gen-mix-small.sh
--- /dev/null
+roles:
+- - mon.a
+ - mgr.x
+ - osd.0
+ - osd.1
+ - osd.2
+- - osd.3
+ - osd.4
+ - osd.5
+ - client.0
+openstack:
+ - volumes: # attached to each instance
+ count: 3
+ size: 10 # GB
+tasks:
+- install:
+- ceph:
+ log-whitelist:
+ - wrongly marked me down
+- thrashosds:
+ op_delay: 30
+ clean_interval: 120
+ chance_down: .5
+- workunit:
+ clients:
+ all:
+ - rados/load-gen-mix-small.sh
--- /dev/null
+../../../../../tasks/thrashosds-health.yaml
\ No newline at end of file
--- /dev/null
+../../../tasks/thrashosds-health.yaml
\ No newline at end of file
--- /dev/null
+../../../tasks/thrashosds-health.yaml
\ No newline at end of file
--- /dev/null
+../../../tasks/thrashosds-health.yaml
\ No newline at end of file
--- /dev/null
+../../../tasks/thrashosds-health.yaml
\ No newline at end of file
--- /dev/null
+../../../tasks/thrashosds-health.yaml
\ No newline at end of file
--- /dev/null
+../../../tasks/thrashosds-health.yaml
\ No newline at end of file
--- /dev/null
+../../../tasks/thrashosds-health.yaml
\ No newline at end of file
--- /dev/null
+../../../../tasks/thrashosds-health.yaml
\ No newline at end of file
+++ /dev/null
-overrides:
- ceph:
- log-whitelist:
- - wrongly marked me down
- - objects unfound and apparently lost
-tasks:
-- thrashosds:
- timeout: 1200
- chance_pgnum_grow: 1
- chance_pgpnum_fix: 1
--- /dev/null
+overrides:
+ ceph:
+ log-whitelist:
+ - wrongly marked me down
+ - objects unfound and apparently lost
+tasks:
+- thrashosds:
+ timeout: 1200
+ chance_pgnum_grow: 1
+ chance_pgpnum_fix: 1
--- /dev/null
+../../../../../tasks/thrashosds-health.yaml
\ No newline at end of file
--- /dev/null
+overrides:
+ ceph:
+ log-whitelist:
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN OSD_
+ - HEALTH_WARN OSDMAP_FLAGS
+ - HEALTH_WARN PG_
+ - HEALTH_ERR OSD_
+ - HEALTH_ERR PG_
+ - HEALTH_WARN SMALLER_PGP_NUM
+ - HEALTH_WARN DEGRADED_OBJECTS
+ - HEALTH_WARN MISPLACED_OBJECTS
+ - HEALTH_WARN SLOW_REQUESTS
+ - HEALTH_WARN TOO_FEW_PGS