alert: 'NVMeoFSubsystemNamespaceLimit',
'for': '1m',
expr: '(count by(nqn, cluster, instance) (ceph_nvmeof_subsystem_namespace_metadata)) >= on(nqn, instance) group_right(cluster) ceph_nvmeof_subsystem_namespace_limit',
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'subsystem' },
annotations: {
summary: '{{ $labels.nqn }} subsystem has reached its maximum number of namespaces%(cluster)s' % $.MultiClusterSummary(),
description: 'Subsystems have a max namespace limit defined at creation time. This alert means that no more namespaces can be added to {{ $labels.nqn }}',
alert: 'NVMeoFMultipleNamespacesOfRBDImage',
'for': '1m',
expr: 'count by(pool_name, rbd_name) (count by(bdev_name, pool_name, rbd_name) (ceph_nvmeof_bdev_metadata and on (bdev_name) ceph_nvmeof_subsystem_namespace_metadata)) > 1',
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'namespace' },
annotations: {
summary: 'RBD image {{ $labels.pool_name }}/{{ $labels.rbd_name }} cannot be reused for multiple NVMeoF namespace ',
description: 'Each NVMeoF namespace must have a unique RBD pool and image, across all different gateway groups.',
alert: 'NVMeoFTooManyGateways',
'for': '1m',
expr: 'count(ceph_nvmeof_gateway_info) by (cluster) > %.2f' % [$._config.NVMeoFMaxGatewaysPerCluster],
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'gateway' },
annotations: {
summary: 'Max supported gateways exceeded%(cluster)s' % $.MultiClusterSummary(),
description: 'You may create many gateways, but %(NVMeoFMaxGatewaysPerCluster)d is the tested limit' % $._config,
alert: 'NVMeoFMaxGatewayGroupSize',
'for': '1m',
expr: 'count(ceph_nvmeof_gateway_info) by (cluster,group) > %.2f' % [$._config.NVMeoFMaxGatewaysPerGroup],
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'gateway' },
annotations: {
summary: 'Max gateways within a gateway group ({{ $labels.group }}) exceeded%(cluster)s' % $.MultiClusterSummary(),
description: 'You may create many gateways in a gateway group, but %(NVMeoFMaxGatewaysPerGroup)d is the tested limit' % $._config,
alert: 'NVMeoFMaxGatewayGroups',
'for': '1m',
expr: 'count(count by (group, cluster) (ceph_nvmeof_gateway_info)) by (cluster) > %.2f' % [$._config.NVMeoFMaxGatewayGroups],
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'gateway' },
annotations: {
summary: 'Max gateway groups exceeded%(cluster)s' % $.MultiClusterSummary(),
description: 'You may create many gateway groups, but %(NVMeoFMaxGatewayGroups)d is the tested limit' % $._config,
alert: 'NVMeoFSingleGateway',
'for': '5m',
expr: 'count(ceph_nvmeof_gateway_info) by(cluster,group) == 1',
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'gateway' },
annotations: {
summary: 'The gateway group {{ $labels.group }} consists of a single gateway - HA is not possible%(cluster)s' % $.MultiClusterSummary(),
description: 'Although a single member gateway group is valid, it should only be used for test purposes',
alert: 'NVMeoFHighGatewayCPU',
'for': '10m',
expr: 'label_replace(avg by(instance, cluster) (rate(ceph_nvmeof_reactor_seconds_total{mode="busy"}[1m])),"instance","$1","instance","(.*):.*") > %.2f' % [$._config.NVMeoFHighGatewayCPU],
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'gateway' },
annotations: {
summary: 'CPU used by {{ $labels.instance }} NVMe-oF Gateway is high%(cluster)s' % $.MultiClusterSummary(),
description: 'Typically, high CPU may indicate degraded performance. Consider increasing the number of reactor cores',
alert: 'NVMeoFGatewayOpenSecurity',
'for': '5m',
expr: 'ceph_nvmeof_subsystem_metadata{allow_any_host="yes"}',
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'subsystem' },
annotations: {
summary: 'Subsystem {{ $labels.nqn }} has been defined without host level security%(cluster)s' % $.MultiClusterSummary(),
description: 'It is good practice to ensure subsystems use host security to reduce the risk of unexpected data loss',
alert: 'NVMeoFTooManySubsystems',
'for': '1m',
expr: 'count by(gateway_host, cluster) (label_replace(ceph_nvmeof_subsystem_metadata,"gateway_host","$1","instance","(.*?)(?::.*)?")) >= %.2f' % [$._config.NVMeoFMaxSubsystemsPerGateway],
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'subsystem' },
annotations: {
summary: 'The number of subsystems defined to the NVMeoF gateway reached or exceeded the supported values%(cluster)s' % $.MultiClusterSummary(),
description: 'NVMeoF gateway {{ $labels.gateway_host }} has reached or exceeded the supported maximum of %(NVMeoFMaxSubsystemsPerGateway)d subsystems. Current count: {{ $value }}.' % $._config,
alert: 'NVMeoFTooManyNamespaces',
'for': '1m',
expr: 'sum by(gateway_host, cluster) (label_replace(ceph_nvmeof_subsystem_namespace_count,"gateway_host","$1","instance","(.*?)(?::.*)?")) >= %.2f' % [$._config.NVMeoFMaxNamespaces],
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'namespace' },
annotations: {
summary: 'The number of namespaces defined to the NVMeoF gateway reached or exceeded supported values%(cluster)s' % $.MultiClusterSummary(),
description: 'NVMeoF gateway {{ $labels.gateway_host }} has reached or exceeded the supported maximum of %(NVMeoFMaxNamespaces)d namespaces. Current count: {{ $value }}.' % $._config,
alert: 'NVMeoFVersionMismatch',
'for': '1h',
expr: 'count(count(ceph_nvmeof_gateway_info) by (cluster, version)) by (cluster) > 1',
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'gateway' },
annotations: {
summary: 'Too many different NVMe-oF gateway releases active%(cluster)s' % $.MultiClusterSummary(),
description: 'This may indicate an issue with deployment. Check cephadm logs',
alert: 'NVMeoFHighClientCount',
'for': '1m',
expr: 'ceph_nvmeof_subsystem_host_count > %.2f' % [$._config.NVMeoFHighClientCount],
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'subsystem' },
annotations: {
summary: 'The number of clients connected to {{ $labels.nqn }} is too high%(cluster)s' % $.MultiClusterSummary(),
description: 'The supported limit for clients connecting to a subsystem is %(NVMeoFHighClientCount)d' % $._config,
alert: 'NVMeoFMissingListener',
'for': '10m',
expr: 'ceph_nvmeof_subsystem_listener_count == 0 and on(nqn) sum(ceph_nvmeof_subsystem_listener_count) by (nqn) > 0',
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'listener' },
annotations: {
summary: 'No listener added for {{ $labels.instance }} NVMe-oF Gateway to {{ $labels.nqn }} subsystem',
description: 'For every subsystem, each gateway should have a listener to balance traffic between gateways.',
alert: 'NVMeoFZeroListenerSubsystem',
'for': '10m',
expr: 'sum(ceph_nvmeof_subsystem_listener_count) by (nqn) == 0',
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'listener' },
annotations: {
summary: 'No listeners added to {{ $labels.nqn }} subsystem',
description: 'NVMeoF gateway configuration incomplete; one of the subsystems have zero listeners.',
alert: 'NVMeoFHighHostCPU',
'for': '10m',
expr: '100-((100*(avg by(cluster,host) (label_replace(rate(node_cpu_seconds_total{mode="idle"}[5m]),"host","$1","instance","(.*):.*")) * on(cluster, host) group_right label_replace(ceph_nvmeof_gateway_info,"host","$1","instance","(.*):.*")))) >= %.2f' % [$._config.NVMeoFHighHostCPU],
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'host' },
annotations: {
summary: 'The CPU is high ({{ $value }}%%) on NVMeoF Gateway host ({{ $labels.host }})%(cluster)s' % $.MultiClusterSummary(),
description: 'High CPU on a gateway host can lead to CPU contention and performance degradation',
alert: 'NVMeoFInterfaceDown',
'for': '30s',
expr: 'ceph_nvmeof_subsystem_listener_iface_info{operstate="down"}',
- labels: { severity: 'warning', type: 'ceph_default', oid: '1.3.6.1.4.1.50495.1.2.1.14.1' },
+ labels: { severity: 'warning', type: 'ceph_default', oid: '1.3.6.1.4.1.50495.1.2.1.14.1', category: 'listener' },
annotations: {
summary: 'Network interface {{ $labels.device }} is down%(cluster)s' % $.MultiClusterSummary(),
description: 'A NIC used by one or more subsystems is in a down state',
alert: 'NVMeoFInterfaceDuplex',
'for': '30s',
expr: 'ceph_nvmeof_subsystem_listener_iface_info{duplex!="full"}',
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'listener' },
annotations: {
summary: 'Network interface {{ $labels.device }} is not running in full duplex mode%(cluster)s' % $.MultiClusterSummary(),
description: 'Until this is resolved, performance from the gateway will be degraded',
alert: 'NVMeoFHighReadLatency',
'for': '5m',
expr: 'label_replace((avg by(instance) ((rate(ceph_nvmeof_bdev_read_seconds_total[1m]) / rate(ceph_nvmeof_bdev_reads_completed_total[1m])))),"gateway","$1","instance","(.*):.*") > %.2f' % [$._config.NVMeoFHighClientReadLatency / 1000],
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'performance' },
annotations: {
summary: 'The average read latency over the last 5 mins has reached %(NVMeoFHighClientReadLatency)d ms or more on {{ $labels.gateway }}' % $._config,
description: 'High latencies may indicate a constraint within the cluster e.g. CPU, network. Please investigate',
alert: 'NVMeoFHighWriteLatency',
'for': '5m',
expr: 'label_replace((avg by(instance) ((rate(ceph_nvmeof_bdev_write_seconds_total[5m]) / rate(ceph_nvmeof_bdev_writes_completed_total[5m])))),"gateway","$1","instance","(.*):.*") > %.2f' % [$._config.NVMeoFHighClientWriteLatency / 1000],
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'performance' },
annotations: {
summary: 'The average write latency over the last 5 mins has reached %(NVMeoFHighClientWriteLatency)d ms or more on {{ $labels.gateway }}' % $._config,
description: 'High latencies may indicate a constraint within the cluster e.g. CPU, network. Please investigate',
alert: 'NVMeoFHostKeepAliveTimeout',
'for': '1m',
expr: 'ceil(changes(ceph_nvmeof_host_keepalive_timeout[%(NVMeoFHostKeepAliveTimeoutTrackDurationHours)dh:]) / 2) > 0' % $._config,
- labels: { severity: 'warning', type: 'ceph_default' },
+ labels: { severity: 'warning', type: 'ceph_default', category: 'host' },
annotations: {
summary: 'Host ({{ $labels.host_nqn }}) was disconnected {{ $value }} times from subsystem ({{ $labels.nqn }}) in last %(NVMeoFHostKeepAliveTimeoutTrackDurationHours)d hours' % $._config,
description: 'Host was disconnected due to host keep alive timeout',
expr: "(count by(nqn, cluster, instance) (ceph_nvmeof_subsystem_namespace_metadata)) >= on(nqn, instance) group_right(cluster) ceph_nvmeof_subsystem_namespace_limit"
for: "1m"
labels:
+ category: "subsystem"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFMultipleNamespacesOfRBDImage"
expr: "count by(pool_name, rbd_name) (count by(bdev_name, pool_name, rbd_name) (ceph_nvmeof_bdev_metadata and on (bdev_name) ceph_nvmeof_subsystem_namespace_metadata)) > 1"
for: "1m"
labels:
+ category: "namespace"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFTooManyGateways"
expr: "count(ceph_nvmeof_gateway_info) by (cluster) > 32.00"
for: "1m"
labels:
+ category: "gateway"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFMaxGatewayGroupSize"
expr: "count(ceph_nvmeof_gateway_info) by (cluster,group) > 8.00"
for: "1m"
labels:
+ category: "gateway"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFMaxGatewayGroups"
expr: "count(count by (group, cluster) (ceph_nvmeof_gateway_info)) by (cluster) > 4.00"
for: "1m"
labels:
+ category: "gateway"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFSingleGateway"
expr: "count(ceph_nvmeof_gateway_info) by(cluster,group) == 1"
for: "5m"
labels:
+ category: "gateway"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFHighGatewayCPU"
expr: "label_replace(avg by(instance, cluster) (rate(ceph_nvmeof_reactor_seconds_total{mode=\"busy\"}[1m])),\"instance\",\"$1\",\"instance\",\"(.*):.*\") > 80.00"
for: "10m"
labels:
+ category: "gateway"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFGatewayOpenSecurity"
expr: "ceph_nvmeof_subsystem_metadata{allow_any_host=\"yes\"}"
for: "5m"
labels:
+ category: "subsystem"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFTooManySubsystems"
expr: "count by(gateway_host, cluster) (label_replace(ceph_nvmeof_subsystem_metadata,\"gateway_host\",\"$1\",\"instance\",\"(.*?)(?::.*)?\")) >= 128.00"
for: "1m"
labels:
+ category: "subsystem"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFTooManyNamespaces"
expr: "sum by(gateway_host, cluster) (label_replace(ceph_nvmeof_subsystem_namespace_count,\"gateway_host\",\"$1\",\"instance\",\"(.*?)(?::.*)?\")) >= 4096.00"
for: "1m"
labels:
+ category: "namespace"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFVersionMismatch"
expr: "count(count(ceph_nvmeof_gateway_info) by (cluster, version)) by (cluster) > 1"
for: "1h"
labels:
+ category: "gateway"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFHighClientCount"
expr: "ceph_nvmeof_subsystem_host_count > 128.00"
for: "1m"
labels:
+ category: "subsystem"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFMissingListener"
expr: "ceph_nvmeof_subsystem_listener_count == 0 and on(nqn) sum(ceph_nvmeof_subsystem_listener_count) by (nqn) > 0"
for: "10m"
labels:
+ category: "listener"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFZeroListenerSubsystem"
expr: "sum(ceph_nvmeof_subsystem_listener_count) by (nqn) == 0"
for: "10m"
labels:
+ category: "listener"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFHighHostCPU"
expr: "100-((100*(avg by(cluster,host) (label_replace(rate(node_cpu_seconds_total{mode=\"idle\"}[5m]),\"host\",\"$1\",\"instance\",\"(.*):.*\")) * on(cluster, host) group_right label_replace(ceph_nvmeof_gateway_info,\"host\",\"$1\",\"instance\",\"(.*):.*\")))) >= 80.00"
for: "10m"
labels:
+ category: "host"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFInterfaceDown"
expr: "ceph_nvmeof_subsystem_listener_iface_info{operstate=\"down\"}"
for: "30s"
labels:
+ category: "listener"
oid: "1.3.6.1.4.1.50495.1.2.1.14.1"
severity: "warning"
type: "ceph_default"
expr: "ceph_nvmeof_subsystem_listener_iface_info{duplex!=\"full\"}"
for: "30s"
labels:
+ category: "listener"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFHighReadLatency"
expr: "label_replace((avg by(instance) ((rate(ceph_nvmeof_bdev_read_seconds_total[1m]) / rate(ceph_nvmeof_bdev_reads_completed_total[1m])))),\"gateway\",\"$1\",\"instance\",\"(.*):.*\") > 0.01"
for: "5m"
labels:
+ category: "performance"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFHighWriteLatency"
expr: "label_replace((avg by(instance) ((rate(ceph_nvmeof_bdev_write_seconds_total[5m]) / rate(ceph_nvmeof_bdev_writes_completed_total[5m])))),\"gateway\",\"$1\",\"instance\",\"(.*):.*\") > 0.02"
for: "5m"
labels:
+ category: "performance"
severity: "warning"
type: "ceph_default"
- alert: "NVMeoFHostKeepAliveTimeout"
expr: "ceil(changes(ceph_nvmeof_host_keepalive_timeout[24h:]) / 2) > 0"
for: "1m"
labels:
+ category: "host"
severity: "warning"
type: "ceph_default"
- name: "certmgr"
severity: warning
cluster: mycluster
type: ceph_default
+ category: subsystem
exp_annotations:
summary: "wah subsystem has reached its maximum number of namespaces on cluster mycluster"
description: "Subsystems have a max namespace limit defined at creation time. This alert means that no more namespaces can be added to wah"
exp_alerts:
- exp_labels:
pool_name: mypool
- rbd_name: myimage1
+ rbd_name: myimage1
severity: warning
type: ceph_default
+ category: namespace
exp_annotations:
summary: "RBD image mypool/myimage1 cannot be reused for multiple NVMeoF namespace "
description: "Each NVMeoF namespace must have a unique RBD pool and image, across all different gateway groups."
severity: warning
cluster: mycluster
type: ceph_default
+ category: gateway
exp_annotations:
summary: "Max supported gateways exceeded on cluster mycluster"
description: "You may create many gateways, but 32 is the tested limit"
severity: warning
cluster: mycluster
type: ceph_default
+ category: gateway
exp_annotations:
summary: "Max gateways within a gateway group (group-1) exceeded on cluster mycluster"
description: "You may create many gateways in a gateway group, but 8 is the tested limit"
severity: warning
cluster: mycluster
type: ceph_default
+ category: gateway
exp_annotations:
summary: "Max gateway groups exceeded on cluster mycluster"
description: "You may create many gateway groups, but 4 is the tested limit"
severity: warning
cluster: mycluster
type: ceph_default
+ category: gateway
exp_annotations:
summary: "The gateway group group-1 consists of a single gateway - HA is not possible on cluster mycluster"
description: "Although a single member gateway group is valid, it should only be used for test purposes"
severity: warning
cluster: mycluster
type: ceph_default
+ category: gateway
exp_annotations:
summary: "CPU used by node-1 NVMe-oF Gateway is high on cluster mycluster"
description: "Typically, high CPU may indicate degraded performance. Consider increasing the number of reactor cores"
severity: warning
cluster: mycluster
type: ceph_default
+ category: subsystem
exp_annotations:
summary: "Subsystem nqn.bad has been defined without host level security on cluster mycluster"
description: "It is good practice to ensure subsystems use host security to reduce the risk of unexpected data loss"
severity: warning
cluster: mycluster
type: ceph_default
+ category: subsystem
exp_annotations:
summary: "The number of subsystems defined to the NVMeoF gateway reached or exceeded the supported values on cluster mycluster"
description: "NVMeoF gateway node-1 has reached or exceeded the supported maximum of 128 subsystems. Current count: 129."
severity: warning
cluster: mycluster
type: ceph_default
+ category: namespace
exp_annotations:
summary: "The number of namespaces defined to the NVMeoF gateway reached or exceeded supported values on cluster mycluster"
description: "NVMeoF gateway node-1 has reached or exceeded the supported maximum of 4096 namespaces. Current count: 4400."
severity: warning
cluster: mycluster
type: ceph_default
+ category: gateway
exp_annotations:
summary: "Too many different NVMe-oF gateway releases active on cluster mycluster"
description: "This may indicate an issue with deployment. Check cephadm logs"
severity: warning
cluster: mycluster
type: ceph_default
+ category: subsystem
exp_annotations:
summary: "The number of clients connected to nqn1 is too high on cluster mycluster"
description: "The supported limit for clients connecting to a subsystem is 128"
nqn: nqn1
severity: warning
type: ceph_default
+ category: listener
exp_annotations:
summary: "No listener added for node-1:9100 NVMe-oF Gateway to nqn1 subsystem"
description: "For every subsystem, each gateway should have a listener to balance traffic between gateways."
nqn: nqn1
severity: warning
type: ceph_default
+ category: listener
exp_annotations:
summary: "No listeners added to nqn1 subsystem"
description: "NVMeoF gateway configuration incomplete; one of the subsystems have zero listeners."
cluster: mycluster
severity: warning
type: ceph_default
+ category: host
exp_annotations:
summary: "The CPU is high (85%) on NVMeoF Gateway host (node-1) on cluster mycluster"
description: "High CPU on a gateway host can lead to CPU contention and performance degradation"
cluster: mycluster
severity: warning
type: ceph_default
+ category: listener
exp_annotations:
summary: "Network interface eth0 is down on cluster mycluster"
description: "A NIC used by one or more subsystems is in a down state"
cluster: mycluster
severity: warning
type: ceph_default
+ category: listener
exp_annotations:
summary: "Network interface eth1 is not running in full duplex mode on cluster mycluster"
description: "Until this is resolved, performance from the gateway will be degraded"
instance: node-1:10008
severity: warning
type: ceph_default
+ category: performance
exp_annotations:
summary: "The average read latency over the last 5 mins has reached 10 ms or more on node-1"
description: "High latencies may indicate a constraint within the cluster e.g. CPU, network. Please investigate"
instance: node-1:10008
severity: warning
type: ceph_default
+ category: performance
exp_annotations:
summary: "The average write latency over the last 5 mins has reached 20 ms or more on node-1"
description: "High latencies may indicate a constraint within the cluster e.g. CPU, network. Please investigate"
nqn: nqn.2016-06.io.spdk:cnode1.mygroup
severity: warning
type: ceph_default
+ category: host
exp_annotations:
summary: "Host (nqn.1) was disconnected 3 times from subsystem (nqn.2016-06.io.spdk:cnode1.mygroup) in last 24 hours"
description: "Host was disconnected due to host keep alive timeout"
nqn: nqn.2016-06.io.spdk:cnode1.mygroup
severity: warning
type: ceph_default
+ category: host
exp_annotations:
summary: "Host (nqn.2) was disconnected 1 times from subsystem (nqn.2016-06.io.spdk:cnode1.mygroup) in last 24 hours"
description: "Host was disconnected due to host keep alive timeout"