"expr": "",
"format": "time_series",
"intervalFactor": 2,
- "refId": "A",
- "target": ""
+ "refId": "A"
}
],
"thresholds": "",
"expr": "",
"format": "time_series",
"intervalFactor": 2,
- "refId": "A",
- "target": ""
+ "refId": "A"
}
],
"thresholds": "",
"expr": "",
"format": "time_series",
"intervalFactor": 2,
- "refId": "A",
- "target": ""
+ "refId": "A"
}
],
"thresholds": "",
"expr": "",
"format": "time_series",
"intervalFactor": 2,
- "refId": "A",
- "target": ""
+ "refId": "A"
}
],
"thresholds": "",
"expr": "",
"format": "time_series",
"intervalFactor": 2,
- "refId": "A",
- "target": ""
+ "refId": "A"
}
],
"thresholds": "",
"expr": "",
"format": "time_series",
"intervalFactor": 2,
- "refId": "A",
- "target": ""
+ "refId": "A"
}
],
"thresholds": "",
"format": "time_series",
"intervalFactor": 2,
"refId": "A",
- "target": "consolidateBy(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.health),\"max\")",
"textEditor": true
}
],
"intervalFactor": 1,
"legendFormat": "total",
"refId": "D",
- "target": "alias(keepLastValue(consolidateBy(maxSeries(collectd.$mon_servers.$domain.cephmetrics.gauge.$cluster_name.mon.num_mon), \"max\")),\"total\")",
"textEditor": true,
"valueHandler": "Text Only"
},
"intervalFactor": 1,
"legendFormat": "quorum",
"refId": "E",
- "target": "alias(keepLastValue(consolidateBy(maxSeries(collectd.$mon_servers.$domain.cephmetrics.gauge.$cluster_name.mon.num_mon_quorum), \"max\")),\"quorum\")",
"textEditor": true,
"valueHandler": "String Threshold",
"warn": "1"
"intervalFactor": 1,
"legendFormat": "down",
"refId": "A",
- "target": "alias(diffSeries(#D,#E), \"down\")",
- "targetFull": "alias(diffSeries(alias(keepLastValue(consolidateBy(maxSeries(collectd.$mon_servers.$domain.cephmetrics.gauge.$cluster_name.mon.num_mon), \"max\")),\"total\"),alias(keepLastValue(consolidateBy(maxSeries(collectd.$mon_servers.$domain.cephmetrics.gauge.$cluster_name.mon.num_mon_quorum), \"max\")),\"quorum\")), \"down\")",
"textEditor": true,
"units": "none",
"valueHandler": "Number Threshold",
"intervalFactor": 2,
"legendFormat": "total",
"refId": "E",
- "target": "alias(keepLastValue(consolidateBy(maxSeries(collectd.$mon_servers.$domain.cephmetrics.gauge.$cluster_name.mon.num_osd), \"max\")),\"total\")",
"textEditor": true,
"valueHandler": "Text Only"
},
"intervalFactor": 2,
"legendFormat": "up",
"refId": "F",
- "target": "alias(keepLastValue(consolidateBy(maxSeries(collectd.$mon_servers.$domain.cephmetrics.gauge.$cluster_name.mon.num_osd_up), \"max\")),\"up\")",
"textEditor": true,
"valueHandler": "Text Only"
},
"intervalFactor": 2,
"legendFormat": "in",
"refId": "A",
- "target": "alias(keepLastValue(consolidateBy(maxSeries(collectd.$mon_servers.$domain.cephmetrics.gauge.$cluster_name.mon.num_osd_in), \"max\")),\"in\")",
"textEditor": true,
"valueHandler": "Text Only"
},
"intervalFactor": 2,
"legendFormat": "out",
"refId": "C",
- "target": "alias(countSeries(currentBelow(groupByNode(transformNull(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.osd_state.*.in,99),-2,\"maxSeries\"),0.5)),\"out\")",
"textEditor": true,
"valueHandler": "Text Only"
},
"intervalFactor": 2,
"legendFormat": "down",
"refId": "B",
- "target": "alias(countSeries(currentBelow(groupByNode(transformNull(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.osd_state.*.up,99),-2,\"maxSeries\"),0.5)),\"down\")",
"textEditor": true,
"units": "none",
"valueHandler": "Number Threshold",
"intervalFactor": 1,
"legendFormat": "total",
"refId": "A",
- "target": "alias(countSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.num_osds),\"total\")",
"textEditor": true,
"valueHandler": "Text Only"
},
"intervalFactor": 1,
"legendFormat": "up",
"refId": "B",
- "target": "alias(countSeries(currentAbove(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.num_osds,0)),\"up\")",
"textEditor": true,
"valueHandler": "Text Only"
},
"intervalFactor": 1,
"legendFormat": "down",
"refId": "C",
- "target": "alias(diffSeries(#A, #B), \"down\")",
- "targetFull": "alias(diffSeries(alias(countSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.num_osds),\"total\"), alias(countSeries(currentAbove(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.num_osds,0)),\"up\")), \"down\")",
"textEditor": true,
"units": "none",
"url": "dashboard/db/ceph-health",
"instant": true,
"intervalFactor": 2,
"refId": "A",
- "target": "alias(maxSeries(groupByNode(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.osd_bytes, 1,\"maxSeries\")), \"raw capacity\")",
"textEditor": true
}
],
"instant": true,
"intervalFactor": 1,
"refId": "A",
- "target": "alias(consolidateBy(maxSeries(timeShift(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.osd_bytes_used,\"7d\")), \"max\"),\"-$growth_window ago\")",
"textEditor": true
}
],
"intervalFactor": 1,
"legendFormat": "Active",
"refId": "B",
- "target": "alias(keepLastValue(consolidateBy(maxSeries(collectd.$mon_servers.$domain.cephmetrics.gauge.$cluster_name.mon.num_pg_active), \"max\")),\"active\")",
"textEditor": true
},
{
"intervalFactor": 1,
"legendFormat": "Degraded",
"refId": "C",
- "target": "alias(diffSeries(#B,#A),\"active + degraded\")",
- "targetFull": "alias(diffSeries(alias(keepLastValue(consolidateBy(maxSeries(collectd.$mon_servers.$domain.cephmetrics.gauge.$cluster_name.mon.num_pg_active), \"max\")),\"active\"),alias(keepLastValue(consolidateBy(maxSeries(collectd.$mon_servers.$domain.cephmetrics.gauge.$cluster_name.mon.num_pg_active_clean), \"max\")),\"active + clean\")),\"active + degraded\")",
"textEditor": true
},
{
"intervalFactor": 1,
"legendFormat": "Peering",
"refId": "D",
- "target": "alias(consolidateBy(maxSeries(collectd.$mon_servers.$domain.cephmetrics.gauge.$cluster_name.mon.num_pg_peering), \"max\"),\"peering\")",
"textEditor": true
},
{
"format": "time_series",
"intervalFactor": 2,
"refId": "A",
- "target": "sumSeries(groupByNode(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.pools.*.recovering_bytes_per_sec,-2,\"avg\"))",
"textEditor": true
}
],
"hide": false,
"intervalFactor": 2,
"refId": "A",
- "target": "consolidateBy(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.deep_scrub),\"max\")",
"textEditor": true
}
],
"tableColumn": "",
"targets": [
{
- "dsType": "influxdb",
"expr": "sum(\n rate(ceph_pool_wr[$__interval])\n)\n+ \nsum(\n rate(ceph_pool_rd[$__interval])\n)",
"format": "time_series",
"groupBy": [],
"hide": false,
"intervalFactor": 1,
"legendFormat": "IOPS",
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.pools._all_.read_op_per_sec",
"policy": "default",
- "query": "SELECT mean(\"value\") FROM \"measurement\" WHERE $timeFilter GROUP BY time($__interval) fill(null)",
"rawQuery": false,
"refId": "A",
"resultFormat": "time_series",
]
],
"tags": [],
- "target": "sumSeries(groupByNode(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.pools.*.op_per_sec,-2,\"maxSeries\"))",
"textEditor": true
}
],
"tableColumn": "",
"targets": [
{
- "dsType": "influxdb",
"expr": "sum(rate(ceph_pool_wr_bytes[$__interval]) + rate(ceph_pool_rd_bytes[$__interval]))",
"format": "time_series",
"groupBy": [],
"hide": false,
"intervalFactor": 1,
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.pools._all_.read_op_per_sec",
"policy": "default",
- "query": "SELECT \"value\" FROM \"collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.pools._all_.read_bytes_sec\" WHERE $timeFilter",
"rawQuery": true,
"refId": "A",
"resultFormat": "time_series",
]
],
"tags": [],
- "target": "sumSeries(groupByNode(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.pools.*.bytes_sec,-2,\"maxSeries\"))",
"textEditor": true
}
],
"tableColumn": "",
"targets": [
{
- "dsType": "influxdb",
"expr": "count(ceph_pool_metadata)",
"format": "time_series",
"groupBy": [],
"intervalFactor": 2,
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_pool",
"policy": "default",
"refId": "A",
"resultFormat": "time_series",
]
],
"tags": [],
- "target": "maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_pool)",
"textEditor": true
}
],
"intervalFactor": 2,
"legendFormat": "reads",
"refId": "A",
- "target": "alias(sumSeries(groupByNode(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.pools.*.read_op_per_sec,-2,\"maxSeries\")), \"Reads\")",
"textEditor": true
},
{
"intervalFactor": 2,
"legendFormat": "writes",
"refId": "B",
- "target": "alias(sumSeries(groupByNode(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.pools.*.write_op_per_sec,-2,\"maxSeries\")), \"Writes\")",
"textEditor": true
}
],
"intervalFactor": 1,
"legendFormat": "commit",
"refId": "A",
- "target": "alias(percentileOfSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.*.apply_latency,$percentile), \"Apply Latency\")",
"textEditor": true
},
{
"intervalFactor": 1,
"legendFormat": "apply",
"refId": "B",
- "target": "alias(percentileOfSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.*.commitcycle_latency, $percentile), \"Commit Latency\")",
"textEditor": true
}
],
"hide": false,
"intervalFactor": 1,
"refId": "A",
- "target": "percentileOfSeries(groupByNode(collectd.$osd_servers.$domain.cpu.percent.{system,user,wait},1,\"sumSeries\"),$percentile)",
"textEditor": true
}
],
"tableColumn": "",
"targets": [
{
- "dsType": "influxdb",
"expr": "quantile(\n $percentile/100, \n (\n node_memory_MemTotal{job='node'} - node_memory_MemFree{job='node'} - node_memory_Buffers{job='node'} - node_memory_Cached{job='node'}\n ) / node_memory_MemTotal{job='node'} * 100\n)",
"format": "time_series",
"groupBy": [],
"hide": false,
"intervalFactor": 2,
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.pools._all_.read_op_per_sec",
"policy": "default",
- "query": "SELECT \"value\" FROM \"collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.pools._all_.read_bytes_sec\" WHERE $timeFilter",
"rawQuery": true,
"refId": "A",
"resultFormat": "time_series",
]
],
"tags": [],
- "target": "percentileOfSeries(collectd.$osd_servers.$domain.memory.percent.used,$percentile)",
"textEditor": true
}
],
"tableColumn": "",
"targets": [
{
- "dsType": "influxdb",
"expr": "sum(\n sum(\n rate(\n node_disk_reads_completed[$__interval]\n )\n ) by (instance,device)\n + ignoring(ceph_daemon,job) group_right(instance) ceph_disk_occupation\n)\n+\nsum(\n sum(\n rate(\n node_disk_writes_completed[$__interval]\n )\n ) by (instance,device)\n + ignoring(ceph_daemon,job) group_right(instance) ceph_disk_occupation\n)",
"format": "time_series",
"groupBy": [],
"hide": false,
"intervalFactor": 1,
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.pools._all_.read_op_per_sec",
"policy": "default",
- "query": "SELECT \"value\" FROM \"collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.pools._all_.read_bytes_sec\" WHERE $timeFilter",
"rawQuery": true,
"refId": "A",
"resultFormat": "time_series",
]
],
"tags": [],
- "target": "alias(sumSeries(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.iops),\"IOPS\")",
"textEditor": true
}
],
"tableColumn": "",
"targets": [
{
- "dsType": "influxdb",
"expr": "# should only include OSD hosts\nsum(\n sum(\n rate(\n node_disk_bytes_read[$__interval]\n )\n ) by (instance,device)\n + ignoring(ceph_daemon,job) group_right(instance) ceph_disk_occupation\n)\n+\nsum(\n sum(\n rate(\n node_disk_bytes_written[$__interval]\n )\n ) by (instance,device)\n + ignoring(ceph_daemon,job) group_right(instance) ceph_disk_occupation\n)",
"format": "time_series",
"groupBy": [],
"hide": false,
"intervalFactor": 1,
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.pools._all_.read_op_per_sec",
"policy": "default",
- "query": "SELECT \"value\" FROM \"collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.pools._all_.read_bytes_sec\" WHERE $timeFilter",
"rawQuery": true,
"refId": "A",
"resultFormat": "time_series",
]
],
"tags": [],
- "target": "sumSeries(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.bytes_per_sec)",
"textEditor": true
},
{
- "dsType": "influxdb",
"expr": "# will include non-OSD hosts\nsum(\n rate(\n node_disk_bytes_read[$__interval]\n ) + \n rate(\n node_disk_bytes_written[$__interval]\n )\n)",
"format": "time_series",
"groupBy": [],
"hide": true,
"intervalFactor": 1,
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.pools._all_.read_op_per_sec",
"policy": "default",
- "query": "SELECT \"value\" FROM \"collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.pools._all_.read_bytes_sec\" WHERE $timeFilter",
"rawQuery": true,
"refId": "B",
"resultFormat": "time_series",
]
],
"tags": [],
- "target": "sumSeries(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.bytes_per_sec)",
"textEditor": true
}
],
"format": "time_series",
"intervalFactor": 2,
"refId": "A",
- "target": "countSeries(currentAbove(transformNull(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.*.osd_percent_used),0),$disk_full_threshold))",
"textEditor": true
}
],
"intervalFactor": 1,
"legendFormat": "average",
"refId": "A",
- "target": "alias(averageSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.util), 'average %util')",
"textEditor": false
},
{
"format": "time_series",
"intervalFactor": 1,
"legendFormat": "$percentile%ile",
- "refId": "B",
- "target": "alias(percentileOfSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.util, $percentile, 'false'), '%util @ $percentile%ile')"
+ "refId": "B"
}
],
"thresholds": [],
"tableColumn": "",
"targets": [
{
- "dsType": "influxdb",
"expr": "count(ceph_mon_metadata)",
"format": "time_series",
"groupBy": [],
"instant": true,
"intervalFactor": 1,
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_pool",
"policy": "default",
"refId": "A",
"resultFormat": "time_series",
"tableColumn": "",
"targets": [
{
- "dsType": "influxdb",
"expr": "count(ceph_mds_metadata)",
"format": "time_series",
"groupBy": [],
"instant": true,
"intervalFactor": 1,
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_pool",
"policy": "default",
"refId": "A",
"resultFormat": "time_series",
"tableColumn": "",
"targets": [
{
- "dsType": "influxdb",
"expr": "count(max by (id) (ceph_osd_metadata))",
"format": "time_series",
"groupBy": [],
"intervalFactor": 2,
"legendFormat": "",
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_pool",
"policy": "default",
"refId": "A",
"resultFormat": "time_series",
"tableColumn": "",
"targets": [
{
- "dsType": "influxdb",
"expr": "count(ceph_pool_metadata)",
"format": "time_series",
"groupBy": [],
"intervalFactor": 2,
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_pool",
"policy": "default",
"refId": "A",
"resultFormat": "time_series",
"targets": [
{
"alias": "Used",
- "dsType": "influxdb",
"expr": "scalar(ceph_cluster_total_used_bytes)",
"format": "time_series",
"groupBy": [],
"intervalFactor": 2,
"legendFormat": "Used",
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.osd_bytes_used",
"policy": "default",
"refId": "B",
"resultFormat": "time_series",
},
{
"alias": "Raw Capacity",
- "dsType": "influxdb",
"expr": "scalar(ceph_cluster_total_bytes)",
"format": "time_series",
"groupBy": [],
"intervalFactor": 2,
"legendFormat": "Raw",
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.osd_bytes",
"policy": "default",
"refId": "A",
"resultFormat": "time_series",
"targets": [
{
"alias": "Used",
- "dsType": "influxdb",
"expr": "max by (name) (\n ceph_pool_bytes_used / (ceph_pool_bytes_used + ceph_pool_max_avail) * 100 + on (pool_id) group_left (name) ceph_pool_metadata\n)",
"format": "time_series",
"groupBy": [],
"targets": [
{
"alias": "Used",
- "dsType": "influxdb",
"expr": "scalar(ceph_cluster_total_objects)",
"format": "time_series",
"groupBy": [],
"intervalFactor": 2,
"legendFormat": "RADOS Objects",
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.osd_bytes_used",
"policy": "default",
"refId": "B",
"resultFormat": "time_series",
],
"repeat": "mon_servers",
"repeatDirection": "v",
- "scopedVars": {
- "mon_servers": {
- "selected": false,
- "text": "mon.rhs-cli-04",
- "value": "mon.rhs-cli-04"
- }
- },
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"repeatDirection": "v",
"repeatIteration": 1526963039202,
"repeatPanelId": 28,
- "scopedVars": {
- "mon_servers": {
- "selected": false,
- "text": "mon.rhs-cli-05",
- "value": "mon.rhs-cli-05"
- }
- },
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"repeatDirection": "v",
"repeatIteration": 1526963039202,
"repeatPanelId": 28,
- "scopedVars": {
- "mon_servers": {
- "selected": false,
- "text": "mon.rhs-cli-06",
- "value": "mon.rhs-cli-06"
- }
- },
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"targets": [
{
"alias": "Objects",
- "dsType": "influxdb",
"expr": "ceph_cluster_total_objects",
"format": "time_series",
"groupBy": [
],
"intervalFactor": 1,
"legendFormat": "Total Objects",
- "measurement": "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_object",
"policy": "default",
"refId": "A",
"resultFormat": "time_series",
"intervalFactor": 1,
"legendFormat": "{{name}}",
"refId": "A",
- "target": "groupByNode(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.pools.$pool_name.bytes_sec,-2,\"maxSeries\")",
"textEditor": true
}
],
"instant": true,
"intervalFactor": 2,
"refId": "A",
- "target": "limit(sortByMaxima(groupByNode(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.pools.*.op_per_sec,-2,\"maxSeries\")),5)",
"textEditor": true
}
],
"instant": true,
"intervalFactor": 2,
"refId": "A",
- "target": "limit(sortByMaxima(groupByNode(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.pools.*.bytes_sec,-2,\"maxSeries\")),5)",
"textEditor": true
}
],
"pointradius": 5,
"points": false,
"renderer": "flot",
- "scopedVars": {
- "pool_name": {
- "selected": false,
- "text": ".rgw.root",
- "value": ".rgw.root"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"stack": true,
"format": "time_series",
"intervalFactor": 1,
"legendFormat": "reads",
- "refId": "B",
- "target": "aliasByNode(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.pools.$pool_name.write_op_per_sec), -1)"
+ "refId": "B"
},
{
"expr": "(label_replace(irate(ceph_pool_wr[1m]),\"id\",\"$1\",\"pool_id\",\"(.*)\") * on(pool_id) group_left(instance,name) ceph_pool_metadata{name=~\"[[pool_name]]\"})",
"format": "time_series",
"intervalFactor": 1,
"legendFormat": "writes",
- "refId": "C",
- "target": "aliasByNode(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.pools.$pool_name.write_op_per_sec), -1)"
+ "refId": "C"
}
],
"thresholds": [],
"pointradius": 5,
"points": false,
"renderer": "flot",
- "scopedVars": {
- "pool_name": {
- "selected": false,
- "text": ".rgw.root",
- "value": ".rgw.root"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"stack": true,
"format": "time_series",
"intervalFactor": 1,
"legendFormat": "reads",
- "refId": "A",
- "target": "aliasByNode(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.pools.$pool_name.read_bytes_sec), -1)"
+ "refId": "A"
},
{
"expr": "(label_replace(irate(ceph_pool_wr_bytes[1m]),\"id\",\"$1\",\"pool_id\",\"(.*)\") + on(pool_id) group_left(instance,name) ceph_pool_metadata{name=~\"[[pool_name]]\"})",
"format": "time_series",
"intervalFactor": 1,
"legendFormat": "writes",
- "refId": "C",
- "target": "aliasByNode(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.pools.$pool_name.read_bytes_sec), -1)"
+ "refId": "C"
}
],
"thresholds": [],
"pointradius": 5,
"points": false,
"renderer": "flot",
- "scopedVars": {
- "rgw_servers": {
- "selected": false,
- "text": "rgw.rhs-srv-01",
- "value": "rgw.rhs-srv-01"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"stack": true,
"pointradius": 5,
"points": false,
"renderer": "flot",
- "scopedVars": {
- "rgw_servers": {
- "selected": false,
- "text": "rgw.rhs-srv-01",
- "value": "rgw.rhs-srv-01"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"stack": true,
"maxDataPoints": 3,
"nullPointMode": "connected",
"pieType": "pie",
- "scopedVars": {
- "rgw_servers": {
- "selected": false,
- "text": "rgw.rhs-srv-01",
- "value": "rgw.rhs-srv-01"
- }
- },
"strokeWidth": 1,
"targets": [
{
"intervalFactor": 1,
"legendFormat": "{{host}}",
"refId": "A",
- "target": "groupByNode(collectd.$osd_servers.$domain.cephmetrics.gauge.$ceph_cluster.osd.*.perf.util,1,\"maxSeries\")",
"textEditor": true
}
],
"points": false,
"renderer": "flot",
"repeat": "osd_servers",
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "apama002",
- "value": "apama002"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira019",
- "value": "mira019"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira021",
- "value": "mira021"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira031",
- "value": "mira031"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira049",
- "value": "mira049"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira055",
- "value": "mira055"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira060",
- "value": "mira060"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira070",
- "value": "mira070"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira076",
- "value": "mira076"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira087",
- "value": "mira087"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira093",
- "value": "mira093"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira099",
- "value": "mira099"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira116",
- "value": "mira116"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira120",
- "value": "mira120"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "mira122",
- "value": "mira122"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
"repeat": null,
"repeatIteration": 1519090074308,
"repeatPanelId": 4,
- "scopedVars": {
- "osd_servers": {
- "selected": false,
- "text": "reesi001",
- "value": "reesi001"
- }
- },
"seriesOverrides": [],
"spaceLength": 10,
"span": 2,
},
"timezone": "",
"title": "Disk Busy By Server"
-}
\ No newline at end of file
+}
{
"__requires": [
{
- "type": "grafana",
- "id": "grafana",
- "name": "Grafana",
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
"version": "4.6.3"
- },
+ },
{
- "type": "panel",
- "id": "graph",
- "name": "Graph",
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
"version": ""
- },
+ },
{
- "type": "datasource",
- "id": "prometheus",
- "name": "Local",
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Local",
"version": "1.0.0"
}
- ],
+ ],
"annotations": {
"list": [
{
- "builtIn": 1,
- "datasource": "-- Grafana --",
- "enable": true,
- "hide": true,
- "iconColor": "rgba(0, 211, 255, 1)",
- "name": "Annotations & Alerts",
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
"type": "dashboard"
}
]
- },
- "editable": true,
- "gnetId": null,
- "graphTooltip": 0,
- "hideControls": false,
- "id": null,
- "links": [],
- "refresh": "15s",
+ },
+ "editable": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "hideControls": false,
+ "id": null,
+ "links": [],
+ "refresh": "15s",
"rows": [
{
- "collapse": false,
- "height": "250px",
+ "collapse": false,
+ "height": "250px",
"panels": [
{
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": null,
- "fill": 1,
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": null,
+ "fill": 1,
"gridPos": {
- "h": 10,
- "w": 24,
- "x": 0,
+ "h": 10,
+ "w": 24,
+ "x": 0,
"y": 0
- },
- "height": "400",
- "id": 1,
+ },
+ "height": "400",
+ "id": 1,
"legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
"values": false
- },
- "lines": true,
- "linewidth": 1,
- "links": [],
- "minSpan": 12,
- "nullPointMode": "connected",
- "percentage": false,
- "pointradius": 5,
- "points": false,
- "renderer": "flot",
- "repeat": null,
- "seriesOverrides": [],
- "spaceLength": 10,
- "span": 12,
- "stack": true,
- "steppedLine": false,
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "minSpan": 12,
+ "nullPointMode": "connected",
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "repeat": null,
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "span": 12,
+ "stack": true,
+ "steppedLine": false,
"targets": [
{
- "expr": "label_replace(irate(node_disk_reads_completed[1m]) + irate(node_disk_writes_completed{instance=~\"[[osd_servers]].*\"}[1m]),\"host\",\"$1\",\"instance\",\"([^.]*).*\")",
- "format": "time_series",
- "hide": true,
- "intervalFactor": 1,
- "legendFormat": "{{host}}",
+ "expr": "label_replace(irate(node_disk_reads_completed[1m]) + irate(node_disk_writes_completed{instance=~\"[[osd_servers]].*\"}[1m]),\"host\",\"$1\",\"instance\",\"([^.]*).*\")",
+ "format": "time_series",
+ "hide": true,
+ "intervalFactor": 1,
+ "legendFormat": "{{host}}",
"refId": "B"
- },
+ },
{
- "expr": "sum(\n sum(\n irate(node_disk_reads_completed{job=\"node\" }[1m]) + \n irate(node_disk_writes_completed{job=\"node\"}[1m]))\n by(instance, device) + ignoring(ceph_daemon,job) group_right(instance) ceph_disk_occupation)\n by(instance)",
- "format": "time_series",
- "intervalFactor": 1,
- "legendFormat": "{{instance}}",
+ "expr": "sum(\n sum(\n irate(node_disk_reads_completed{job=\"node\" }[1m]) + \n irate(node_disk_writes_completed{job=\"node\"}[1m]))\n by(instance, device) + ignoring(ceph_daemon,job) group_right(instance) ceph_disk_occupation)\n by(instance)",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{instance}}",
"refId": "A"
}
- ],
- "thresholds": [],
- "timeFrom": null,
- "timeShift": null,
- "title": "Disk IOPS Across All OSD Hosts",
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeShift": null,
+ "title": "Disk IOPS Across All OSD Hosts",
"tooltip": {
- "shared": true,
- "sort": 0,
+ "shared": true,
+ "sort": 0,
"value_type": "individual"
- },
- "type": "graph",
+ },
+ "type": "graph",
"xaxis": {
- "buckets": null,
- "mode": "time",
- "name": null,
- "show": true,
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
"values": []
- },
+ },
"yaxes": [
{
- "format": "none",
- "label": "",
- "logBase": 1,
- "max": null,
- "min": "0",
+ "format": "none",
+ "label": "",
+ "logBase": 1,
+ "max": null,
+ "min": "0",
"show": true
- },
+ },
{
- "format": "short",
- "label": null,
- "logBase": 1,
- "max": null,
- "min": null,
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
"show": true
}
]
}
- ],
- "repeat": null,
- "repeatIteration": null,
- "repeatRowId": null,
- "showTitle": true,
- "title": "All Servers by IOPS",
+ ],
+ "repeat": null,
+ "repeatIteration": null,
+ "repeatRowId": null,
+ "showTitle": true,
+ "title": "All Servers by IOPS",
"titleSize": "h6"
- },
+ },
{
- "collapse": false,
- "height": 250,
+ "collapse": false,
+ "height": 250,
"panels": [
{
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": null,
- "fill": 1,
- "id": 2,
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": null,
+ "fill": 1,
+ "id": 2,
"legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": false,
- "total": false,
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
"values": false
- },
- "lines": true,
- "linewidth": 1,
- "links": [],
- "nullPointMode": "null",
- "percentage": false,
- "pointradius": 5,
- "points": false,
- "renderer": "flot",
- "repeat": "osd_servers",
- "seriesOverrides": [],
- "spaceLength": 10,
- "span": 4,
- "stack": false,
- "steppedLine": false,
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "repeat": "osd_servers",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "span": 4,
+ "stack": false,
+ "steppedLine": false,
"targets": [
{
- "expr": "sum(\n sum(\n irate(node_disk_reads_completed{instance=~\"[[osd_servers]].*\"}[1m]) + irate(node_disk_writes_completed[1m]))\n by(instance,device) +\n ignoring(ceph_daemon,job) group_right(instance) ceph_disk_occupation)\n \n \n",
- "format": "time_series",
- "intervalFactor": 2,
+ "expr": "sum(\n sum(\n irate(node_disk_reads_completed{instance=~\"[[osd_servers]].*\"}[1m]) + irate(node_disk_writes_completed[1m]))\n by(instance,device) +\n ignoring(ceph_daemon,job) group_right(instance) ceph_disk_occupation)\n \n \n",
+ "format": "time_series",
+ "intervalFactor": 2,
"refId": "A"
}
- ],
- "thresholds": [],
- "timeFrom": null,
- "timeShift": null,
- "title": "Total IOPS for $osd_servers",
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeShift": null,
+ "title": "Total IOPS for $osd_servers",
"tooltip": {
- "shared": true,
- "sort": 0,
+ "shared": true,
+ "sort": 0,
"value_type": "individual"
- },
- "type": "graph",
+ },
+ "type": "graph",
"xaxis": {
- "buckets": null,
- "mode": "time",
- "name": null,
- "show": true,
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
"values": []
- },
+ },
"yaxes": [
{
- "format": "none",
- "label": null,
- "logBase": 1,
- "max": null,
- "min": null,
+ "format": "none",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
"show": true
- },
+ },
{
- "format": "short",
- "label": null,
- "logBase": 1,
- "max": null,
- "min": null,
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
"show": true
}
]
}
- ],
- "repeat": null,
- "repeatIteration": null,
- "repeatRowId": null,
- "showTitle": true,
- "title": "IOPS Load by Server",
+ ],
+ "repeat": null,
+ "repeatIteration": null,
+ "repeatRowId": null,
+ "showTitle": true,
+ "title": "IOPS Load by Server",
"titleSize": "h6"
}
- ],
- "schemaVersion": 14,
- "style": "dark",
- "tags": [],
+ ],
+ "schemaVersion": 14,
+ "style": "dark",
+ "tags": [],
"templating": {
"list": [
{
- "allValue": "",
- "current": {},
- "datasource": null,
- "hide": 2,
- "includeAll": true,
- "label": "OSD Host",
- "multi": false,
- "name": "osd_servers",
- "options": [],
- "query": "label_values(ceph_disk_occupation, instance)",
- "refresh": 1,
- "regex": "([^.]*).*",
- "sort": 1,
- "tagValuesQuery": "",
- "tags": [],
- "tagsQuery": "",
- "type": "query",
+ "allValue": "",
+ "current": {},
+ "datasource": null,
+ "hide": 2,
+ "includeAll": true,
+ "label": "OSD Host",
+ "multi": false,
+ "name": "osd_servers",
+ "options": [],
+ "query": "label_values(ceph_disk_occupation, instance)",
+ "refresh": 1,
+ "regex": "([^.]*).*",
+ "sort": 1,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
"useTags": false
}
]
- },
+ },
"time": {
- "from": "now-1h",
+ "from": "now-1h",
"to": "now"
- },
+ },
"timepicker": {
"refresh_intervals": [
- "5s",
- "10s",
- "15s",
- "30s",
- "1m",
- "5m",
- "15m",
- "30m",
- "1h",
- "2h",
+ "5s",
+ "10s",
+ "15s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
"1d"
- ],
+ ],
"time_options": [
- "5m",
- "15m",
- "1h",
- "6h",
- "12h",
- "24h",
- "2d",
- "7d",
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
"30d"
]
- },
- "timezone": "",
- "title": "IOPS by Server",
+ },
+ "timezone": "",
+ "title": "IOPS by Server",
"version": 6
-}
\ No newline at end of file
+}
"selected": true,
"text": "All",
"value": "$__all"
- },
- {
- "selected": false,
- "text": "rhs-cli-04.ceph-dev.lab.eng.rdu2.redhat.com",
- "value": "rhs-cli-04.ceph-dev.lab.eng.rdu2.redhat.com"
- },
- {
- "selected": false,
- "text": "rhs-cli-05.ceph-dev.lab.eng.rdu2.redhat.com",
- "value": "rhs-cli-05.ceph-dev.lab.eng.rdu2.redhat.com"
- },
- {
- "selected": false,
- "text": "rhs-cli-06.ceph-dev.lab.eng.rdu2.redhat.com",
- "value": "rhs-cli-06.ceph-dev.lab.eng.rdu2.redhat.com"
}
],
- "query": "rhs-cli-04.ceph-dev.lab.eng.rdu2.redhat.com,rhs-cli-05.ceph-dev.lab.eng.rdu2.redhat.com,rhs-cli-06.ceph-dev.lab.eng.rdu2.redhat.com",
+ "query": "",
"type": "custom"
},
{