From: Paul Cuzner Date: Mon, 21 Aug 2017 04:57:16 +0000 (+1200) Subject: dashboard query update to filter out old OSDs X-Git-Tag: v1.0~30^2~2 X-Git-Url: http://git-server-git.apps.pok.os.sepia.ceph.com/?a=commitdiff_plain;h=4059a948e5e6edae573a8c5d398294255edc4622;p=cephmetrics.git dashboard query update to filter out old OSDs Old OSDs will still exist in the TSDB, and could show as out or down. The update uses transformNull to pick out osds with null values and filter them out of the results shown. --- diff --git a/dashboards/current/ceph-backend-storage.json b/dashboards/current/ceph-backend-storage.json index a7a9476..8cc216a 100644 --- a/dashboards/current/ceph-backend-storage.json +++ b/dashboards/current/ceph-backend-storage.json @@ -1,37 +1,78 @@ { "dashboard" : { - "version" : 18, + "links" : [ + { + "icon" : "external link", + "keepTime" : true, + "title" : "Shortcuts", + "tags" : [ + "overview" + ], + "asDropdown" : true, + "type" : "dashboards", + "targetBlank" : true, + "includeVars" : true + } + ], + "version" : 20, + "title" : "Ceph Backend Storage", + "timezone" : "browser", + "timepicker" : { + "refresh_intervals" : [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options" : [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "time" : { + "from" : "now-1h", + "to" : "now" + }, "templating" : { "list" : [ { - "tagsQuery" : "", - "name" : "cluster_name", - "multi" : false, - "tags" : [], - "label" : null, "sort" : 0, + "tagsQuery" : "", "regex" : "", - "refresh" : 1, - "hide" : 2, - "query" : "collectd.*.$domain.cephmetrics.gauge.*", - "options" : [], + "name" : "cluster_name", "tagValuesQuery" : "", + "label" : null, "current" : { - "text" : "ceph", "value" : "ceph", + "text" : "ceph", "selected" : true }, - "allValue" : null, - "type" : "query", + "options" : [], + "multi" : false, "datasource" : "Local", "includeAll" : false, - "useTags" : false + "hide" : 2, + "query" : "collectd.*.$domain.cephmetrics.gauge.*", + "useTags" : false, + "refresh" : 1, + "allValue" : null, + "type" : "query", + "tags" : [] }, { - "type" : "custom", - "includeAll" : false, - "label" : null, - "name" : "domain", "options" : [ { "value" : "test.lab", @@ -39,273 +80,271 @@ "selected" : true } ], - "current" : { - "text" : "test.lab", - "value" : "test.lab", - "selected" : true - }, "multi" : false, - "allValue" : null, "hide" : 2, - "query" : "test.lab" + "includeAll" : false, + "query" : "test.lab", + "allValue" : null, + "type" : "custom", + "name" : "domain", + "label" : null, + "current" : { + "selected" : true, + "text" : "test.lab", + "value" : "test.lab" + } }, { - "label" : "Percentile", - "includeAll" : false, + "allValue" : null, "type" : "custom", - "hide" : 0, "query" : "80,85,90,95,98", - "allValue" : null, - "multi" : false, + "label" : "Percentile", "current" : { - "text" : "95", "value" : "95", + "text" : "95", "selected" : true }, "name" : "percentile", "options" : [ { - "value" : "80", "text" : "80", - "selected" : false + "selected" : false, + "value" : "80" }, { - "value" : "85", + "selected" : false, "text" : "85", - "selected" : false + "value" : "85" }, { - "value" : "90", + "selected" : false, "text" : "90", - "selected" : false + "value" : "90" }, { - "value" : "95", "text" : "95", - "selected" : true + "selected" : true, + "value" : "95" }, { - "selected" : false, + "value" : "98", "text" : "98", - "value" : "98" + "selected" : false } - ] + ], + "multi" : false, + "includeAll" : false, + "hide" : 0 }, { - "label" : "OSD Hostname", - "includeAll" : true, - "type" : "custom", "hide" : 0, - "query" : "ceph-1,ceph-2,ceph-3", - "allValue" : "", - "multi" : true, - "current" : { - "value" : "$__all", - "text" : "All", - "selected" : true - }, - "name" : "osd_servers", + "includeAll" : true, "options" : [ { "selected" : true, - "value" : "$__all", - "text" : "All" + "text" : "All", + "value" : "$__all" }, { "value" : "ceph-1", - "text" : "ceph-1", - "selected" : false + "selected" : false, + "text" : "ceph-1" }, { - "selected" : false, "value" : "ceph-2", + "selected" : false, "text" : "ceph-2" }, { - "value" : "ceph-3", + "selected" : false, "text" : "ceph-3", - "selected" : false + "value" : "ceph-3" } - ] + ], + "multi" : true, + "label" : "OSD Hostname", + "current" : { + "value" : "$__all", + "selected" : true, + "text" : "All" + }, + "name" : "osd_servers", + "allValue" : "", + "type" : "custom", + "query" : "ceph-1,ceph-2,ceph-3" }, { - "hide" : 2, + "type" : "custom", + "allValue" : null, "query" : "85", + "current" : { + "text" : "85", + "selected" : true, + "value" : "85" + }, + "label" : null, + "name" : "disk_full_threshold", + "multi" : false, "options" : [ { "text" : "85", - "value" : "85", - "selected" : true + "selected" : true, + "value" : "85" } ], - "name" : "disk_full_threshold", - "allValue" : null, - "multi" : false, - "current" : { - "text" : "85", - "value" : "85", - "selected" : true - }, - "label" : null, - "type" : "custom", + "hide" : 2, "includeAll" : false } ] }, + "gnetId" : null, + "style" : "dark", + "hideControls" : true, + "editable" : false, + "annotations" : { + "list" : [] + }, + "graphTooltip" : 0, + "schemaVersion" : 14, + "id" : 13, + "tags" : [], "rows" : [ { - "collapse" : false, - "repeat" : null, - "repeatIteration" : null, "panels" : [ { - "sort" : { - "col" : null, - "desc" : false - }, - "id" : 56, + "type" : "table", "minSpan" : 1, - "title" : "OSD's Down", - "links" : [], + "transform" : "timeseries_aggregations", + "id" : 56, "targets" : [ { + "target" : "currentBelow(groupByNode(transformNull(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.osd_state.*.up,99),-2,\"maxSeries\"),0.5)", "hide" : false, - "textEditor" : true, - "target" : "currentBelow(groupByNode(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.osd_state.*.up,-2,\"maxSeries\"),0.5)", - "refId" : "B" + "refId" : "B", + "textEditor" : true } ], - "hideTimeOverride" : true, - "fontSize" : "100%", - "transform" : "timeseries_aggregations", "columns" : [ { - "text" : "Current", - "value" : "current" + "value" : "current", + "text" : "Current" } ], + "showHeader" : true, + "fontSize" : "100%", "styles" : [ { - "colorMode" : null, + "thresholds" : [ + "" + ], + "type" : "number", + "sanitize" : false, + "pattern" : "Metric", "colors" : [ "rgba(50, 172, 45, 0.97)", "rgba(237, 129, 40, 0.89)", "rgba(245, 54, 54, 0.9)" ], - "pattern" : "Metric", "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "sanitize" : false, + "colorMode" : null, + "alias" : "OSD Id", "decimals" : 0, - "thresholds" : [ - "" - ], - "unit" : "short", - "type" : "number", - "alias" : "OSD Id" + "unit" : "short" }, { - "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "thresholds" : [ + "0" + ], + "type" : "hidden", "pattern" : "Current", "colors" : [ "rgba(50, 172, 45, 0.97)", "rgba(237, 129, 40, 0.89)", "rgba(245, 54, 54, 0.9)" ], + "dateFormat" : "YYYY-MM-DD HH:mm:ss", "colorMode" : "cell", "alias" : "Status", "decimals" : 0, - "thresholds" : [ - "0" - ], - "unit" : "short", - "type" : "hidden" + "unit" : "short" } ], - "timeFrom" : "1m", - "type" : "table", "pageSize" : 100, + "scroll" : true, + "title" : "OSD's Down", + "timeFrom" : "1m", "span" : 1, + "links" : [], + "sort" : { + "col" : null, + "desc" : false + }, "timeShift" : null, - "scroll" : true, - "showHeader" : true + "hideTimeOverride" : true }, { - "scroll" : true, - "showHeader" : true, - "fontSize" : "100%", - "span" : 2, "type" : "table", - "title" : "Disks Near Full", - "links" : [], + "transform" : "timeseries_aggregations", "minSpan" : 2, - "pageSize" : null, - "targets" : [ - { - "target" : "aliasByNode(currentAbove(transformNull(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.*.osd_percent_used),0),$disk_full_threshold),1,-2)", - "refId" : "A", - "textEditor" : true - } - ], - "id" : 57, "styles" : [ { - "type" : "date", "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "type" : "date", "alias" : "Time", "pattern" : "Time" }, { - "colorMode" : null, + "type" : "number", + "thresholds" : [], + "pattern" : "Host and Disk", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], - "pattern" : "Host and Disk", - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "thresholds" : [], + "colorMode" : null, "decimals" : 0, - "unit" : "short", - "type" : "number", - "alias" : "% Full" + "alias" : "% Full", + "unit" : "short" }, { "unit" : "none", - "type" : "number", - "decimals" : 0, - "thresholds" : [], "alias" : "% Full", - "colors" : [ - "rgba(245, 54, 54, 0.9)", + "decimals" : 0, + "colorMode" : null, + "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "colors" : [ + "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], - "colorMode" : null, - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "pattern" : "Current" + "pattern" : "Current", + "thresholds" : [], + "type" : "number" }, { - "unit" : "short", "type" : "number", - "decimals" : 2, "thresholds" : [], - "alias" : "Host.OSD Id", + "pattern" : "Metric", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], "colorMode" : null, - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "pattern" : "Metric" + "decimals" : 2, + "alias" : "Host.OSD Id", + "unit" : "short" }, { - "alias" : "", + "pattern" : "/.*/", "type" : "number", - "unit" : "short", "thresholds" : [], "decimals" : 2, - "pattern" : "/.*/", + "alias" : "", + "unit" : "short", "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", @@ -314,963 +353,924 @@ "colorMode" : null } ], + "id" : 57, + "pageSize" : null, + "targets" : [ + { + "textEditor" : true, + "refId" : "A", + "target" : "aliasByNode(currentAbove(transformNull(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.*.osd_percent_used),0),$disk_full_threshold),1,-2)" + } + ], + "scroll" : true, + "title" : "Disks Near Full", "columns" : [ { - "text" : "Current", - "value" : "current" + "value" : "current", + "text" : "Current" } ], "sort" : { - "col" : 0, - "desc" : true + "desc" : true, + "col" : 0 }, - "transform" : "timeseries_aggregations" + "span" : 2, + "links" : [], + "showHeader" : true, + "fontSize" : "100%" }, { - "maxDataPoints" : "1", - "fontSize" : "100%", - "targets" : [ - { - "textEditor" : true, - "refId" : "A", - "target" : "groupByNode(keepLastValue(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.stat_bytes),1,\"sumSeries\")" - } - ], - "minSpan" : 3, + "scroll" : true, "title" : "Host OSD Raw Capacity", "links" : [], - "id" : 58, "sort" : { "col" : 0, "desc" : false }, - "showHeader" : true, - "scroll" : true, "span" : 3, - "pageSize" : null, - "type" : "table", - "columns" : [ - { - "text" : "Current", - "value" : "current" - } - ], "styles" : [ { "type" : "date", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", "pattern" : "Time", - "alias" : "Time", - "dateFormat" : "YYYY-MM-DD HH:mm:ss" + "alias" : "Time" }, { + "dateFormat" : "YYYY-MM-DD HH:mm:ss", "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], "colorMode" : null, - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "pattern" : "Current", "decimals" : 2, - "thresholds" : [], + "alias" : "Total OSD Capacity", "unit" : "decbytes", "type" : "number", - "alias" : "Total OSD Capacity" + "thresholds" : [], + "pattern" : "Current" }, { - "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "thresholds" : [], + "type" : "number", "pattern" : "Metric", + "colorMode" : null, "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], - "colorMode" : null, + "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "unit" : "short", "alias" : "Host Name", - "decimals" : 2, - "thresholds" : [], - "type" : "number", - "unit" : "short" + "decimals" : 2 }, { - "type" : "number", - "unit" : "short", - "thresholds" : [], "decimals" : 2, "alias" : "", + "unit" : "short", "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], "colorMode" : null, - "pattern" : "/.*/" + "pattern" : "/.*/", + "thresholds" : [], + "type" : "number" } ], - "transform" : "timeseries_aggregations" - }, - { - "span" : 3, - "scroll" : true, + "pageSize" : null, + "targets" : [ + { + "textEditor" : true, + "refId" : "A", + "target" : "groupByNode(keepLastValue(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.stat_bytes),1,\"sumSeries\")" + } + ], + "maxDataPoints" : "1", "showHeader" : true, - "transform" : "timeseries_aggregations", + "fontSize" : "100%", "columns" : [ { "value" : "current", "text" : "Current" } ], + "type" : "table", + "minSpan" : 3, + "transform" : "timeseries_aggregations", + "id" : 58 + }, + { "styles" : [ { - "type" : "date", - "alias" : "Time", "pattern" : "Time", + "alias" : "Time", + "type" : "date", "dateFormat" : "YYYY-MM-DD HH:mm:ss" }, { - "alias" : "# OSDs", - "thresholds" : [], - "decimals" : 0, - "unit" : "none", "type" : "number", - "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "thresholds" : [], "pattern" : "Current", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], - "colorMode" : null + "colorMode" : null, + "alias" : "# OSDs", + "decimals" : 0, + "unit" : "none" }, { "pattern" : "Metric", - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "colorMode" : null, + "type" : "number", + "thresholds" : [], + "alias" : "Host Name", + "decimals" : 2, + "unit" : "short", "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], - "alias" : "Host Name", - "unit" : "short", - "type" : "number", - "thresholds" : [], - "decimals" : 2 + "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "colorMode" : null }, { - "unit" : "short", - "type" : "number", - "thresholds" : [], "decimals" : 2, "alias" : "", + "unit" : "short", "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], "colorMode" : null, - "pattern" : "/.*/" + "pattern" : "/.*/", + "thresholds" : [], + "type" : "number" } ], - "type" : "table", "pageSize" : null, - "fontSize" : "100%", - "maxDataPoints" : "10", + "scroll" : true, + "title" : "Host OSD Capacity Breakdown", + "span" : 3, "sort" : { "col" : 0, "desc" : false }, - "id" : 59, - "title" : "Host OSD Capacity Breakdown", - "minSpan" : 3, "links" : [], + "type" : "table", + "transform" : "timeseries_aggregations", + "minSpan" : 3, + "id" : 59, "targets" : [ { + "textEditor" : true, "refId" : "A", - "target" : "aliasByNode(keepLastValue(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.num_osds,6),1)", - "textEditor" : true + "target" : "aliasByNode(keepLastValue(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.num_osds,6),1)" + } + ], + "maxDataPoints" : "10", + "fontSize" : "100%", + "showHeader" : true, + "columns" : [ + { + "value" : "current", + "text" : "Current" } ] } ], - "height" : 250, - "title" : "Disk/OSD Host Summary", "showTitle" : true, + "repeatRowId" : null, "titleSize" : "h5", - "repeatRowId" : null + "collapse" : false, + "repeatIteration" : null, + "title" : "Disk/OSD Host Summary", + "repeat" : null, + "height" : 250 }, { - "collapse" : true, - "repeat" : null, + "height" : "300", "repeatIteration" : null, + "title" : "Disk/OSD Load Summary", + "repeat" : null, + "collapse" : true, + "repeatRowId" : null, + "titleSize" : "h5", "panels" : [ { - "yAxis" : { - "format" : "short", - "decimals" : null, - "logBase" : 1, - "max" : "100", - "show" : true, - "splitFactor" : null, - "min" : "0" - }, - "type" : "heatmap", - "yBucketSize" : 5, - "dataFormat" : "timeseries", - "color" : { - "cardColor" : "#b4ff00", - "mode" : "spectrum", - "exponent" : 0.5, - "colorScheme" : "interpolateRdYlGn", - "colorScale" : "sqrt" - }, - "xBucketNumber" : 180, + "heatmap" : {}, "span" : 6, - "description" : "The heatmap categorizes disk utilization into discrete buckets (e.g util 0-5) and shows the frequency of the number of disks that fall within that range as a color. The color chosen depends on the number of disks in the 'bucket', ranging from green (low) to red (high). Hover over a colored block to show the count of disk utilization observations at that point.", - "id" : 53, + "links" : [], "highlightCards" : true, "xAxis" : { "show" : true }, + "yBucketSize" : 5, + "title" : "Disk Drive Utilization Heatmap - $osd_servers", + "xBucketSize" : "", + "description" : "The heatmap categorizes disk utilization into discrete buckets (e.g util 0-5) and shows the frequency of the number of disks that fall within that range as a color. The color chosen depends on the number of disks in the 'bucket', ranging from green (low) to red (high). Hover over a colored block to show the count of disk utilization observations at that point.", + "cards" : { + "cardRound" : null, + "cardPadding" : null + }, "yBucketNumber" : null, + "xBucketNumber" : 180, + "dataFormat" : "timeseries", "targets" : [ { "textEditor" : true, - "target" : "collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.util", - "refId" : "A" + "refId" : "A", + "target" : "collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.util" } ], - "title" : "Disk Drive Utilization Heatmap - $osd_servers", - "links" : [], - "minSpan" : 6, - "tooltip" : { - "showHistogram" : false, + "yAxis" : { + "format" : "short", + "splitFactor" : null, + "min" : "0", + "decimals" : null, + "max" : "100", + "logBase" : 1, "show" : true }, - "xBucketSize" : "", - "heatmap" : {}, - "cards" : { - "cardPadding" : null, - "cardRound" : null - } + "id" : 53, + "color" : { + "exponent" : 0.5, + "colorScheme" : "interpolateRdYlGn", + "colorScale" : "sqrt", + "mode" : "spectrum", + "cardColor" : "#b4ff00" + }, + "type" : "heatmap", + "tooltip" : { + "show" : true, + "showHistogram" : false + }, + "minSpan" : 6 }, { - "bars" : false, - "span" : 6, + "title" : "Disk Throughput - $osd_servers", + "nullPointMode" : "null", + "dashes" : false, + "spaceLength" : 10, "renderer" : "flot", - "pointradius" : 5, + "aliasColors" : { + "Write Throughput" : "#E0752D", + "Read Throughput" : "#629E51" + }, + "points" : false, "timeShift" : null, - "steppedLine" : false, - "stack" : true, - "percentage" : false, - "dashLength" : 10, + "span" : 6, + "linewidth" : 1, + "links" : [], "timeFrom" : null, - "datasource" : "Local", - "type" : "graph", - "fill" : 1, - "legend" : { - "values" : false, - "current" : false, - "avg" : false, - "total" : false, - "show" : true, - "max" : false, - "min" : false - }, - "xaxis" : { - "buckets" : null, - "values" : [], - "name" : null, - "mode" : "time", - "show" : true - }, - "spaceLength" : 10, - "nullPointMode" : "null", - "linewidth" : 1, "yaxes" : [ { - "logBase" : 1, - "format" : "decbytes", + "min" : "0", "label" : null, + "format" : "decbytes", + "logBase" : 1, "show" : true, - "max" : null, - "min" : "0" + "max" : null }, { - "max" : null, - "label" : null, - "show" : true, "min" : null, + "label" : null, "format" : "short", - "logBase" : 1 + "show" : true, + "logBase" : 1, + "max" : null } ], - "tooltip" : { - "value_type" : "individual", - "shared" : true, - "sort" : 0 - }, - "lines" : true, - "dashes" : false, - "seriesOverrides" : [], - "aliasColors" : { - "Read Throughput" : "#629E51", - "Write Throughput" : "#E0752D" - }, - "points" : false, - "id" : 24, "thresholds" : [], + "percentage" : false, + "stack" : true, "targets" : [ { - "textEditor" : true, "target" : "alias(sumSeries(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.r_bytes_per_sec), \"Read Throughput\")", + "textEditor" : true, "refId" : "A" }, { - "refId" : "B", "target" : "alias(sumSeries(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.w_bytes_per_sec), \"Write Throughput\")", + "refId" : "B", "textEditor" : true } ], - "title" : "Disk Throughput - $osd_servers", - "links" : [], - "minSpan" : 6 - }, - { - "bars" : false, - "pointradius" : 5, - "renderer" : "flot", - "span" : 6, - "timeShift" : null, - "steppedLine" : false, - "stack" : true, "dashLength" : 10, - "percentage" : false, - "timeFrom" : null, - "type" : "graph", "datasource" : "Local", - "xaxis" : { - "values" : [], - "name" : null, - "buckets" : null, - "mode" : "time", - "show" : true - }, - "spaceLength" : 10, - "nullPointMode" : "null as zero", + "bars" : false, + "steppedLine" : false, + "fill" : 1, + "pointradius" : 5, + "seriesOverrides" : [], "legend" : { "show" : true, + "avg" : false, "max" : false, - "min" : false, "values" : false, - "avg" : false, - "current" : false, - "total" : false + "total" : false, + "min" : false, + "current" : false }, - "fill" : 1, + "minSpan" : 6, + "type" : "graph", + "tooltip" : { + "value_type" : "individual", + "shared" : true, + "sort" : 0 + }, + "id" : 24, + "xaxis" : { + "mode" : "time", + "show" : true, + "name" : null, + "buckets" : null, + "values" : [] + }, + "lines" : true + }, + { "yaxes" : [ { - "min" : "0", "max" : null, + "logBase" : 1, "show" : true, - "label" : null, + "min" : "0", "format" : "ms", - "logBase" : 1 + "label" : null }, { - "format" : "short", - "logBase" : 1, "max" : null, + "logBase" : 1, "show" : true, - "label" : null, - "min" : null + "format" : "short", + "min" : null, + "label" : null + } + ], + "timeFrom" : null, + "links" : [ + { + "keepTime" : true, + "targetBlank" : true, + "type" : "dashboard", + "title" : "Latency by Server", + "dashUri" : "db/latency-by-server", + "includeVars" : true, + "dashboard" : "Latency by Server" } ], + "span" : 6, "linewidth" : 1, - "dashes" : false, - "lines" : true, - "tooltip" : { - "sort" : 0, - "shared" : true, - "value_type" : "individual" - }, + "timeShift" : null, + "points" : false, "aliasColors" : { "Read Latency" : "#629E51", "Write Latency" : "#E0752D" }, - "seriesOverrides" : [], - "points" : false, - "id" : 40, + "dashes" : false, + "spaceLength" : 10, + "renderer" : "flot", + "nullPointMode" : "null as zero", "title" : "Disk Latency - $osd_servers OSDs @ $percentile%ile", - "minSpan" : 6, - "links" : [ + "percentage" : false, + "thresholds" : [ { - "dashboard" : "Latency by Server", - "keepTime" : true, - "targetBlank" : true, - "dashUri" : "db/latency-by-server", - "includeVars" : true, - "type" : "dashboard", - "title" : "Latency by Server" + "value" : 50, + "op" : "gt", + "fill" : false, + "lineColor" : "rgba(178, 0, 0, 0.29)", + "line" : true, + "colorMode" : "custom" } ], + "fill" : 1, + "steppedLine" : false, + "datasource" : "Local", + "bars" : false, + "dashLength" : 10, "targets" : [ { - "textEditor" : true, + "target" : "alias(percentileOfSeries(group(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.r_await),$percentile), \"Read Latency\")", "refId" : "A", - "target" : "alias(percentileOfSeries(group(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.r_await),$percentile), \"Read Latency\")" + "textEditor" : true }, { "textEditor" : true, - "target" : "alias(percentileOfSeries(group(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.w_await),$percentile), \"Write Latency\")", - "refId" : "C" + "refId" : "C", + "target" : "alias(percentileOfSeries(group(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.w_await),$percentile), \"Write Latency\")" } ], - "thresholds" : [ - { - "op" : "gt", - "colorMode" : "custom", - "lineColor" : "rgba(178, 0, 0, 0.29)", - "fill" : false, - "line" : true, - "value" : 50 - } - ] - }, - { - "fill" : 1, - "spaceLength" : 10, + "stack" : true, + "lines" : true, "xaxis" : { - "name" : null, - "values" : [], - "buckets" : null, "mode" : "time", - "show" : true - }, - "nullPointMode" : "null", - "legend" : { "show" : true, - "max" : false, - "min" : false, - "values" : true, - "current" : true, - "avg" : false, - "total" : false + "buckets" : null, + "name" : null, + "values" : [] }, + "id" : 40, "tooltip" : { - "sort" : 0, "shared" : true, + "sort" : 0, "value_type" : "individual" }, - "lines" : true, - "dashes" : false, - "linewidth" : 1, + "type" : "graph", + "minSpan" : 6, + "legend" : { + "max" : false, + "show" : true, + "avg" : false, + "current" : false, + "total" : false, + "min" : false, + "values" : false + }, + "seriesOverrides" : [], + "pointradius" : 5 + }, + { "yaxes" : [ { + "max" : "100", + "show" : true, "logBase" : 1, + "min" : "0", "format" : "short", - "label" : "", - "show" : true, - "max" : "100", - "min" : "0" + "label" : "" }, { - "format" : "short", "logBase" : 1, - "max" : null, "show" : false, + "max" : null, + "min" : null, "label" : null, - "min" : null + "format" : "short" } ], - "seriesOverrides" : [], + "timeFrom" : null, + "linewidth" : 1, + "span" : 6, + "links" : [ + { + "includeVars" : true, + "dashUri" : "db/disk-busy-by-server", + "dashboard" : "Disk Busy by Server", + "title" : "Disk Busy by Server", + "type" : "dashboard", + "targetBlank" : true, + "keepTime" : true + } + ], + "timeShift" : null, + "points" : false, "aliasColors" : { "disk busy %" : "#3F6833" }, + "spaceLength" : 10, + "dashes" : false, + "renderer" : "flot", + "title" : "Disk Utilization - $osd_servers OSDs at $percentile%ile", + "nullPointMode" : "null", + "percentage" : false, "thresholds" : [ { + "line" : true, "colorMode" : "custom", + "lineColor" : "rgba(178, 0, 0, 0.29)", "op" : "gt", - "value" : 80, "fill" : false, - "line" : true, - "lineColor" : "rgba(178, 0, 0, 0.29)" + "value" : 80 } ], + "fill" : 1, + "steppedLine" : false, + "datasource" : "Local", + "bars" : false, + "dashLength" : 10, "targets" : [ { "refId" : "A", - "target" : "alias(percentileOfSeries(group(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.util),$percentile), \"disk busy %\")", - "textEditor" : true + "textEditor" : true, + "target" : "alias(percentileOfSeries(group(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.util),$percentile), \"disk busy %\")" } ], - "minSpan" : 6, - "title" : "Disk Utilization - $osd_servers OSDs at $percentile%ile", - "links" : [ - { - "dashUri" : "db/disk-busy-by-server", - "targetBlank" : true, - "keepTime" : true, - "dashboard" : "Disk Busy by Server", - "type" : "dashboard", - "title" : "Disk Busy by Server", - "includeVars" : true - } - ], - "id" : 43, - "points" : false, - "span" : 6, - "renderer" : "flot", - "pointradius" : 5, - "bars" : false, - "steppedLine" : false, - "timeShift" : null, - "percentage" : false, - "dashLength" : 10, "stack" : false, - "datasource" : "Local", + "lines" : true, + "xaxis" : { + "show" : true, + "mode" : "time", + "values" : [], + "name" : null, + "buckets" : null + }, + "id" : 43, + "tooltip" : { + "value_type" : "individual", + "sort" : 0, + "shared" : true + }, "type" : "graph", - "timeFrom" : null + "minSpan" : 6, + "legend" : { + "values" : true, + "total" : false, + "min" : false, + "current" : true, + "show" : true, + "avg" : false, + "max" : false + }, + "pointradius" : 5, + "seriesOverrides" : [] }, { - "timeShift" : null, - "steppedLine" : false, - "bars" : false, - "pointradius" : 5, + "spaceLength" : 10, + "dashes" : false, "renderer" : "flot", + "title" : "IOPS per Disk @ $percentile%ile - $osd_servers OSDs", + "nullPointMode" : "null", + "points" : false, + "aliasColors" : { + "IOPS/spindle" : "#3F6833" + }, "span" : 6, + "links" : [], + "linewidth" : 1, + "timeShift" : null, "timeFrom" : null, - "type" : "graph", - "datasource" : "Local", - "stack" : false, - "dashLength" : 10, - "percentage" : false, "yaxes" : [ { - "format" : "short", - "logBase" : 1, "max" : null, "show" : true, - "label" : null, - "min" : "0" + "logBase" : 1, + "format" : "short", + "min" : "0", + "label" : null }, { + "label" : null, + "min" : null, "format" : "short", - "logBase" : 1, "max" : null, - "show" : true, - "label" : null, - "min" : null + "logBase" : 1, + "show" : true } ], - "linewidth" : 1, - "lines" : true, - "dashes" : false, - "tooltip" : { - "value_type" : "individual", - "shared" : true, - "sort" : 0 - }, - "spaceLength" : 10, - "xaxis" : { - "mode" : "time", - "show" : true, - "name" : null, - "values" : [], - "buckets" : null - }, - "legend" : { - "values" : false, - "total" : false, - "avg" : false, - "current" : false, - "max" : false, - "show" : false, - "min" : false - }, - "nullPointMode" : "null", - "fill" : 1, - "id" : 46, - "points" : false, - "title" : "IOPS per Disk @ $percentile%ile - $osd_servers OSDs", - "minSpan" : 6, - "links" : [], "thresholds" : [], + "percentage" : false, + "dashLength" : 10, "targets" : [ { - "textEditor" : true, "target" : "alias(percentileOfSeries(group(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.iops),$percentile),\"IOPS/spindle\")", + "textEditor" : true, "refId" : "A" } ], - "aliasColors" : { - "IOPS/spindle" : "#3F6833" - }, - "seriesOverrides" : [] - }, - { - "xaxis" : { - "values" : [], - "buckets" : null, - "name" : null, - "mode" : "time", - "show" : true - }, - "spaceLength" : 10, + "stack" : false, + "steppedLine" : false, + "datasource" : "Local", + "bars" : false, + "fill" : 1, "legend" : { - "values" : false, + "min" : false, "total" : false, "current" : false, - "avg" : false, + "values" : false, "max" : false, "show" : false, - "min" : false + "avg" : false }, - "nullPointMode" : "null", - "fill" : 1, - "dashes" : false, - "lines" : true, + "seriesOverrides" : [], + "pointradius" : 5, + "type" : "graph", "tooltip" : { "shared" : true, "sort" : 0, "value_type" : "individual" }, - "yaxes" : [ - { - "min" : "0", - "max" : null, - "label" : null, - "show" : true, - "format" : "short", - "logBase" : 1 - }, - { - "min" : null, - "label" : null, - "show" : false, - "max" : null, - "logBase" : 1, - "format" : "short" - } - ], - "linewidth" : 1, + "minSpan" : 6, + "id" : 46, + "lines" : true, + "xaxis" : { + "values" : [], + "name" : null, + "buckets" : null, + "show" : true, + "mode" : "time" + } + }, + { + "thresholds" : [], + "percentage" : false, + "spaceLength" : 10, + "renderer" : "flot", + "dashes" : false, + "nullPointMode" : "null", + "title" : "Total Disk IOPS - $osd_servers OSDs", + "points" : false, "aliasColors" : { "IOPS" : "#3F6833" }, - "seriesOverrides" : [], - "title" : "Total Disk IOPS - $osd_servers OSDs", + "span" : 6, "links" : [ { - "targetBlank" : true, - "keepTime" : true, "dashboard" : "IOPS by Server", - "dashUri" : "db/iops-by-server", "includeVars" : true, + "dashUri" : "db/iops-by-server", + "title" : "IOPS by Server", "type" : "dashboard", - "title" : "IOPS by Server" + "keepTime" : true, + "targetBlank" : true } ], - "minSpan" : 6, - "thresholds" : [], - "targets" : [ + "linewidth" : 1, + "timeShift" : null, + "yaxes" : [ { - "textEditor" : true, - "target" : "alias(sumSeries(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.iops),\"IOPS\")", - "refId" : "A" + "label" : null, + "min" : "0", + "format" : "short", + "max" : null, + "logBase" : 1, + "show" : true + }, + { + "label" : null, + "min" : null, + "format" : "short", + "max" : null, + "show" : false, + "logBase" : 1 } ], - "points" : false, - "id" : 47, + "timeFrom" : null, + "legend" : { + "min" : false, + "total" : false, + "current" : false, + "values" : false, + "max" : false, + "avg" : false, + "show" : false + }, + "seriesOverrides" : [], "pointradius" : 5, - "renderer" : "flot", - "span" : 6, - "bars" : false, - "steppedLine" : false, - "timeShift" : null, - "dashLength" : 10, - "percentage" : false, - "stack" : false, - "datasource" : "Local", "type" : "graph", - "timeFrom" : null - } - ], - "height" : "300", - "title" : "Disk/OSD Load Summary", - "showTitle" : true, - "titleSize" : "h5", - "repeatRowId" : null - }, - { - "repeat" : null, - "repeatIteration" : null, - "collapse" : true, - "showTitle" : true, - "titleSize" : "h5", - "repeatRowId" : null, - "panels" : [ - { - "points" : false, - "id" : 44, + "tooltip" : { + "shared" : true, + "sort" : 0, + "value_type" : "individual" + }, "minSpan" : 6, - "title" : "CPU Utilization - $osd_servers", - "links" : [], - "thresholds" : [], + "id" : 47, + "lines" : true, + "xaxis" : { + "mode" : "time", + "show" : true, + "name" : null, + "buckets" : null, + "values" : [] + }, "targets" : [ { + "refId" : "A", "textEditor" : true, - "target" : "alias(percentileOfSeries(groupByNode(collectd.*.$domain.cpu.percent.{wait,interrupt,nice,user,system}, 1, \"sumSeries\"),$percentile),\"Cluster-wide CPU Busy @ $percentile%ile\")", - "refId" : "A" - }, - { - "textEditor" : true, - "hide" : false, - "target" : "alias(averageSeries(groupByNode(collectd.$osd_servers.$domain.cpu.percent.{wait,interrupt,nice,user,system}, 1, \"sumSeries\")),\"Average OSD Host(s) CPU Busy\")", - "refId" : "B" + "target" : "alias(sumSeries(collectd.$osd_servers.$domain.cephmetrics.gauge.$cluster_name.osd.*.perf.iops),\"IOPS\")" } ], + "dashLength" : 10, + "stack" : false, + "steppedLine" : false, + "bars" : false, + "datasource" : "Local", + "fill" : 1 + } + ], + "showTitle" : true + }, + { + "panels" : [ + { + "thresholds" : [], + "percentage" : false, + "points" : false, "aliasColors" : { + "Max CPU Busy - all OSD Hosts" : "#BF1B00", "CPU Busy" : "#447EBC", "CPU Busy @ 95%ile" : "#890F02", - "Cluster-wide CPU Busy @ 95%ile" : "#890F02", "Max CPU Busy" : "#BF1B00", - "Max CPU Busy - all OSD Hosts" : "#BF1B00" + "Cluster-wide CPU Busy @ 95%ile" : "#890F02" }, - "seriesOverrides" : [ - { - "alias" : "Cluster-wide CPU Busy @ 95%ile", - "fill" : 0 - } - ], + "dashes" : false, + "spaceLength" : 10, + "renderer" : "flot", + "title" : "CPU Utilization - $osd_servers", + "nullPointMode" : "null as zero", + "timeFrom" : null, "yaxes" : [ { - "max" : "100", - "label" : "", - "show" : true, "min" : "0", + "label" : "", "format" : "short", - "logBase" : 1 + "max" : "100", + "logBase" : 1, + "show" : true }, { + "format" : "short", + "min" : null, "label" : null, - "show" : true, "max" : null, - "min" : null, "logBase" : 1, - "format" : "short" + "show" : true } ], + "span" : 6, + "links" : [], "linewidth" : 1, - "lines" : true, - "dashes" : false, + "timeShift" : null, + "type" : "graph", "tooltip" : { "value_type" : "individual", - "sort" : 0, - "shared" : true - }, - "xaxis" : { - "show" : true, - "mode" : "time", - "values" : [], - "name" : null, - "buckets" : null + "shared" : true, + "sort" : 0 }, - "nullPointMode" : "null as zero", - "spaceLength" : 10, + "minSpan" : 6, "legend" : { - "total" : false, - "avg" : false, - "current" : false, "values" : false, + "current" : false, "min" : false, - "max" : false, - "show" : true + "total" : false, + "avg" : false, + "show" : true, + "max" : false }, - "fill" : 3, - "timeFrom" : null, - "datasource" : "Local", - "type" : "graph", - "stack" : false, + "pointradius" : 5, + "seriesOverrides" : [ + { + "fill" : 0, + "alias" : "Cluster-wide CPU Busy @ 95%ile" + } + ], + "lines" : true, + "xaxis" : { + "mode" : "time", + "show" : true, + "buckets" : null, + "name" : null, + "values" : [] + }, + "id" : 44, "dashLength" : 10, - "percentage" : false, - "timeShift" : null, + "targets" : [ + { + "target" : "alias(percentileOfSeries(groupByNode(collectd.*.$domain.cpu.percent.{wait,interrupt,nice,user,system}, 1, \"sumSeries\"),$percentile),\"Cluster-wide CPU Busy @ $percentile%ile\")", + "refId" : "A", + "textEditor" : true + }, + { + "textEditor" : true, + "refId" : "B", + "hide" : false, + "target" : "alias(averageSeries(groupByNode(collectd.$osd_servers.$domain.cpu.percent.{wait,interrupt,nice,user,system}, 1, \"sumSeries\")),\"Average OSD Host(s) CPU Busy\")" + } + ], + "stack" : false, + "fill" : 3, "steppedLine" : false, "bars" : false, - "renderer" : "flot", - "pointradius" : 5, - "span" : 6 + "datasource" : "Local" }, { - "aliasColors" : { - "Network load (rx+tx)" : "#3F6833" - }, - "seriesOverrides" : [], - "thresholds" : [], + "steppedLine" : false, + "bars" : false, + "datasource" : "Local", + "fill" : 1, + "dashLength" : 10, "targets" : [ { + "hide" : true, "target" : "collectd.$osd_servers.$domain.interface.*.if_octets.rx", - "refId" : "A", - "hide" : true + "refId" : "A" }, { + "hide" : true, "target" : "collectd.$osd_servers.$domain.interface.*.if_octets.tx", - "refId" : "B", - "hide" : true + "refId" : "B" }, { + "refId" : "C", "textEditor" : true, - "target" : "alias(sumSeries(#A,#B), \"Network load (rx+tx)\")", "targetFull" : "alias(sumSeries(collectd.$osd_servers.$domain.interface.*.if_octets.rx,collectd.$osd_servers.$domain.interface.*.if_octets.tx), \"Network load (rx+tx)\")", - "refId" : "C" - } - ], - "minSpan" : 6, - "title" : "Network Load - $osd_servers", - "links" : [ - { - "dashboard" : "Network Usage by Node", - "keepTime" : true, - "targetBlank" : true, - "dashUri" : "db/network-usage-by-node", - "includeVars" : true, - "title" : "Network Load by Node", - "type" : "dashboard" + "target" : "alias(sumSeries(#A,#B), \"Network load (rx+tx)\")" } ], + "stack" : false, "id" : 49, - "points" : false, - "fill" : 1, + "lines" : true, "xaxis" : { "values" : [], "name" : null, "buckets" : null, - "mode" : "time", - "show" : true + "show" : true, + "mode" : "time" }, - "spaceLength" : 10, "legend" : { - "values" : false, - "total" : false, "avg" : false, - "current" : false, - "max" : false, "show" : true, + "max" : false, + "values" : false, + "current" : false, + "total" : false, "min" : false }, - "nullPointMode" : "null", + "pointradius" : 5, + "seriesOverrides" : [], + "type" : "graph", "tooltip" : { "value_type" : "individual", "sort" : 0, "shared" : true }, - "dashes" : false, - "lines" : true, + "minSpan" : 6, + "links" : [ + { + "dashUri" : "db/network-usage-by-node", + "includeVars" : true, + "dashboard" : "Network Usage by Node", + "title" : "Network Load by Node", + "type" : "dashboard", + "keepTime" : true, + "targetBlank" : true + } + ], + "span" : 6, "linewidth" : 1, + "timeShift" : null, "yaxes" : [ { + "show" : true, "logBase" : 1, - "format" : "bytes", - "min" : null, + "max" : null, "label" : null, - "show" : true, - "max" : null + "min" : null, + "format" : "bytes" }, { - "format" : "short", + "show" : true, "logBase" : 1, "max" : null, - "show" : true, "label" : null, - "min" : null + "min" : null, + "format" : "short" } ], - "percentage" : false, - "dashLength" : 10, - "stack" : false, - "datasource" : "Local", - "type" : "graph", "timeFrom" : null, - "span" : 6, "renderer" : "flot", - "pointradius" : 5, - "bars" : false, - "steppedLine" : false, - "timeShift" : null + "spaceLength" : 10, + "dashes" : false, + "nullPointMode" : "null", + "title" : "Network Load - $osd_servers", + "points" : false, + "aliasColors" : { + "Network load (rx+tx)" : "#3F6833" + }, + "percentage" : false, + "thresholds" : [] } ], - "height" : 250, - "title" : "OSD Host CPU and Network Load" - } - ], - "title" : "Ceph Backend Storage", - "links" : [ - { - "includeVars" : true, - "tags" : [ - "overview" - ], - "icon" : "external link", - "title" : "Shortcuts", - "type" : "dashboards", - "keepTime" : true, - "targetBlank" : true, - "asDropdown" : true + "showTitle" : true, + "collapse" : true, + "titleSize" : "h5", + "repeatRowId" : null, + "title" : "OSD Host CPU and Network Load", + "repeat" : null, + "repeatIteration" : null, + "height" : 250 } ], - "id" : 13, - "style" : "dark", - "tags" : [], - "timepicker" : { - "time_options" : [ - "5m", - "15m", - "1h", - "6h", - "12h", - "24h", - "2d", - "7d", - "30d" - ], - "refresh_intervals" : [ - "5s", - "10s", - "30s", - "1m", - "5m", - "15m", - "30m", - "1h", - "2h", - "1d" - ] - }, - "hideControls" : true, - "annotations" : { - "list" : [] - }, - "timezone" : "browser", - "graphTooltip" : 0, - "schemaVersion" : 14, - "time" : { - "from" : "now-1h", - "to" : "now" - }, - "refresh" : "10s", - "gnetId" : null, - "editable" : false + "refresh" : "10s" }, "meta" : { - "slug" : "ceph-backend-storage", "expires" : "0001-01-01T00:00:00Z", + "updatedBy" : "admin", + "type" : "db", + "canSave" : true, "canStar" : true, - "createdBy" : "admin", "canEdit" : true, - "updated" : "2017-08-18T21:45:43Z", - "version" : 18, - "canSave" : true, + "createdBy" : "admin", + "slug" : "ceph-backend-storage", + "updated" : "2017-08-21T03:31:38Z", "created" : "2017-08-03T21:42:28Z", - "updatedBy" : "admin", - "type" : "db" + "version" : 20 } } diff --git a/dashboards/current/ceph-health.json b/dashboards/current/ceph-health.json index 530bacd..0a53200 100644 --- a/dashboards/current/ceph-health.json +++ b/dashboards/current/ceph-health.json @@ -1,127 +1,78 @@ { "dashboard" : { - "id" : 29, - "links" : [ - { - "type" : "dashboards", - "tags" : [ - "overview" - ], - "icon" : "external link", - "title" : "Shortcuts", - "asDropdown" : true, - "targetBlank" : true, - "includeVars" : true, - "keepTime" : true - } - ], - "time" : { - "to" : "now", - "from" : "now-1h" - }, - "annotations" : { - "list" : [ - { - "tags" : "health_alert", - "type" : "alert", - "showIn" : 0, - "limit" : 100, - "iconColor" : "rgba(255, 96, 96, 1)", - "enable" : true, - "datasource" : "Local", - "hide" : false, - "name" : "health_alert" - }, - { - "enable" : true, - "hide" : false, - "name" : "health_ok", - "datasource" : "Local", - "limit" : 100, - "iconColor" : "rgb(1, 195, 0)", - "showIn" : 0, - "tags" : "health_ok", - "type" : "alert" - } - ] - }, - "style" : "dark", "templating" : { "list" : [ { - "regex" : "", - "useTags" : false, - "tags" : [], - "sort" : 0, - "query" : "collectd.*.$domain.cephmetrics.gauge.*", - "datasource" : "Local", - "name" : "cluster_name", - "hide" : 2, - "tagValuesQuery" : "", - "refresh" : 1, - "tagsQuery" : "", - "allValue" : null, - "type" : "query", "current" : { - "text" : "ceph", "value" : "ceph", + "text" : "ceph", "selected" : true }, + "refresh" : 1, "multi" : false, + "sort" : 0, + "regex" : "", + "hide" : 2, "includeAll" : false, + "tagValuesQuery" : "", + "tagsQuery" : "", + "name" : "cluster_name", + "datasource" : "Local", + "tags" : [], + "allValue" : null, + "useTags" : false, "options" : [], + "query" : "collectd.*.$domain.cephmetrics.gauge.*", + "type" : "query", "label" : null }, { - "type" : "custom", - "query" : "test.lab", + "allValue" : null, + "name" : "domain", + "hide" : 2, + "includeAll" : false, "current" : { - "value" : "test.lab", + "selected" : true, "text" : "test.lab", - "selected" : true + "value" : "test.lab" }, - "allValue" : null, + "multi" : false, + "type" : "custom", + "label" : null, + "query" : "test.lab", "options" : [ { "value" : "test.lab", - "text" : "test.lab", - "selected" : true + "selected" : true, + "text" : "test.lab" } - ], - "label" : null, - "multi" : false, - "hide" : 2, - "includeAll" : false, - "name" : "domain" + ] }, { "current" : { + "value" : "$__all", "selected" : true, - "text" : "All", - "value" : "$__all" + "text" : "All" }, - "query" : "ceph-1,ceph-2,ceph-3", - "type" : "custom", + "includeAll" : true, + "hide" : 2, "allValue" : null, "name" : "osd_servers", - "hide" : 2, - "includeAll" : true, - "multi" : true, "options" : [ { + "selected" : true, "text" : "All", - "value" : "$__all", - "selected" : true + "value" : "$__all" }, { - "value" : "ceph-1", "text" : "ceph-1", - "selected" : false + "selected" : false, + "value" : "ceph-1" }, { + "selected" : false, "text" : "ceph-2", - "value" : "ceph-2", - "selected" : false + "value" : "ceph-2" }, { "value" : "ceph-3", @@ -129,398 +80,403 @@ "selected" : false } ], - "label" : null + "multi" : true, + "label" : null, + "type" : "custom", + "query" : "ceph-1,ceph-2,ceph-3" }, { - "allValue" : null, - "query" : "85", - "current" : { - "text" : "85", - "value" : "85", - "selected" : true - }, - "type" : "custom", - "name" : "disk_full_threshold", - "hide" : 2, - "includeAll" : false, - "multi" : false, "options" : [ { - "selected" : true, "value" : "85", + "selected" : true, "text" : "85" } ], - "label" : null + "multi" : false, + "query" : "85", + "type" : "custom", + "label" : null, + "current" : { + "text" : "85", + "selected" : true, + "value" : "85" + }, + "hide" : 2, + "includeAll" : false, + "allValue" : null, + "name" : "disk_full_threshold" } ] }, - "gnetId" : null, - "tags" : [ - "overview" - ], "rows" : [ { - "repeatRowId" : null, "height" : "70", - "title" : "Dashboard Row", - "collapse" : false, "repeat" : null, + "collapse" : false, + "repeatRowId" : null, "titleSize" : "h6", - "showTitle" : false, + "repeatIteration" : null, "panels" : [ { - "span" : 12, - "nullText" : null, "timeShift" : null, - "title" : "", - "datasource" : "Local", + "timeFrom" : "1m", + "prefixFontSize" : "50%", "gauge" : { - "maxValue" : 100, + "thresholdMarkers" : true, "thresholdLabels" : false, "show" : false, "minValue" : 0, - "thresholdMarkers" : true + "maxValue" : 100 }, - "links" : [], + "mappingTypes" : [ + { + "value" : 1, + "name" : "value to text" + }, + { + "name" : "range to text", + "value" : 2 + } + ], + "height" : "70", + "postfixFontSize" : "50%", + "hideTimeOverride" : true, + "maxDataPoints" : "", "rangeMaps" : [ { + "text" : "HEALTH OK", "from" : "0", - "to" : "1", - "text" : "HEALTH OK" + "to" : "1" }, { + "to" : "4", "text" : "HEALTH WARNING", - "from" : "1", - "to" : "4" + "from" : "1" }, { - "text" : "HEALTH ERROR", "to" : "99", + "text" : "HEALTH ERROR", "from" : "5" }, { + "text" : "NODATA", "from" : "-10", - "to" : "0", - "text" : "NODATA" + "to" : "0" } ], - "mappingType" : 2, - "height" : "70", - "interval" : null, - "prefixFontSize" : "50%", + "format" : "none", "valueMaps" : [ { + "text" : "OK", "op" : "=", - "value" : "0", - "text" : "OK" + "value" : "0" }, { + "text" : "WARN", "op" : "=", - "value" : "4", - "text" : "WARN" + "value" : "4" }, { - "value" : "8", "text" : "ERROR", - "op" : "=" + "op" : "=", + "value" : "8" } ], - "tableColumn" : "", - "colorValue" : false, - "timeFrom" : "1m", - "nullPointMode" : "connected", - "mappingTypes" : [ - { - "value" : 1, - "name" : "value to text" - }, + "type" : "singlestat", + "cacheTimeout" : null, + "title" : "", + "targets" : [ { - "value" : 2, - "name" : "range to text" + "target" : "consolidateBy(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.health),\"max\")", + "textEditor" : true, + "refId" : "A" } ], - "type" : "singlestat", - "maxDataPoints" : "", - "format" : "none", + "prefix" : "", + "valueName" : "current", + "description" : "Shows the overall health of the ceph cluster. To see specific health messages hover over the annotation in the health chart below.", + "datasource" : "Local", + "colorValue" : false, + "colorBackground" : true, + "links" : [], + "postfix" : "", + "nullText" : null, + "minSpan" : 1, + "nullPointMode" : "connected", "colors" : [ "rgba(1, 167, 1, 1)", "rgba(255,165,0, 1)", "rgba(255, 0, 0, 1)" ], - "minSpan" : 1, - "description" : "Shows the overall health of the ceph cluster. To see specific health messages hover over the annotation in the health chart below.", - "cacheTimeout" : null, - "valueName" : "current", + "mappingType" : 2, + "interval" : null, "id" : 76, + "span" : 12, + "valueFontSize" : "50%", "thresholds" : "1,5", "sparkline" : { "lineColor" : "rgb(31, 120, 193)", "show" : false, - "full" : false, - "fillColor" : "rgba(31, 118, 189, 0.18)" + "fillColor" : "rgba(31, 118, 189, 0.18)", + "full" : false }, - "targets" : [ - { - "refId" : "A", - "target" : "consolidateBy(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.health),\"max\")", - "textEditor" : true - } - ], - "valueFontSize" : "50%", - "postfix" : "", - "hideTimeOverride" : true, - "postfixFontSize" : "50%", - "prefix" : "", - "colorBackground" : true + "tableColumn" : "" } ], - "repeatIteration" : null + "title" : "Dashboard Row", + "showTitle" : false }, { - "repeat" : null, - "repeatRowId" : null, "height" : "350", + "repeat" : null, "collapse" : false, - "title" : "Cluster Health", - "showTitle" : true, + "repeatRowId" : null, + "titleSize" : "h5", + "repeatIteration" : null, "panels" : [ { - "spaceLength" : 10, - "targets" : [ - { - "textEditor" : true, - "target" : "alias(maxSeries(summarize(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.health,\"5min\",\"max\")), 'Ceph Health')", - "refId" : "A" - } - ], - "yaxes" : [ + "xaxis" : { + "mode" : "time", + "buckets" : null, + "show" : true, + "values" : [], + "name" : null + }, + "pointradius" : 5, + "thresholds" : [ { - "format" : "short", - "logBase" : 1, - "show" : false, - "label" : "", - "max" : "10", - "min" : "-1" - }, - { - "max" : null, - "min" : null, - "label" : null, - "logBase" : 1, - "show" : false, - "format" : "short" - } - ], - "lines" : true, - "points" : false, - "steppedLine" : true, - "hideTimeOverride" : true, - "description" : "The chart plots the clusters health, over time. Health is depicted as a integer; 0, 4 or 8 where 0 is OK, 4 is WARN and 8 represents an ERROR state. Horizontal thresholds (drawn in yellow and red) indicate when the cluster's health transitions to 'warning' or 'error'. Annotations describing the details of the clusters health may also be shown if the \"EventURL\" setting is defined to the collectd plugin on the mon hosts.", - "bars" : false, - "minSpan" : 3, - "renderer" : "flot", - "thresholds" : [ - { - "op" : "gt", + "value" : 3, + "fillColor" : "rgba(222, 226, 0, 0.47)", + "lineColor" : "rgb(247, 172, 0)", "line" : true, "fill" : false, - "lineColor" : "rgb(247, 172, 0)", - "value" : 3, "colorMode" : "custom", - "fillColor" : "rgba(222, 226, 0, 0.47)" + "op" : "gt" }, { - "op" : "gt", + "fillColor" : "rgba(246, 3, 3, 0.5)", + "value" : 7, "fill" : false, "line" : true, - "lineColor" : "rgb(203, 0, 0)", - "value" : 7, + "op" : "gt", "colorMode" : "custom", - "fillColor" : "rgba(246, 3, 3, 0.5)" + "lineColor" : "rgb(203, 0, 0)" } ], + "span" : 12, "dashLength" : 10, "id" : 55, + "description" : "The chart plots the clusters health, over time. Health is depicted as a integer; 0, 4 or 8 where 0 is OK, 4 is WARN and 8 represents an ERROR state. Horizontal thresholds (drawn in yellow and red) indicate when the cluster's health transitions to 'warning' or 'error'. Annotations describing the details of the clusters health may also be shown if the \"EventURL\" setting is defined to the collectd plugin on the mon hosts.", + "datasource" : "Local", + "bars" : false, + "fill" : 1, + "yaxes" : [ + { + "logBase" : 1, + "format" : "short", + "min" : "-1", + "show" : false, + "label" : "", + "max" : "10" + }, + { + "format" : "short", + "logBase" : 1, + "max" : null, + "label" : null, + "show" : false, + "min" : null + } + ], "nullPointMode" : "null", - "timeFrom" : "3d", - "xaxis" : { - "mode" : "time", - "buckets" : null, - "name" : null, - "show" : true, - "values" : [] - }, + "minSpan" : 3, + "dashes" : false, + "links" : [], "aliasColors" : { "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.health" : "#DEDAF7", - "Ceph Health" : "#3F6833", - "Ceph Health (0:OK, 4:Warning,8:Error)" : "#DEDAF7" + "Ceph Health (0:OK, 4:Warning,8:Error)" : "#DEDAF7", + "Ceph Health" : "#3F6833" }, - "height" : "350", - "fill" : 1, - "linewidth" : 2, - "maxDataPoints" : "", "percentage" : false, - "type" : "graph", + "lines" : true, + "points" : false, "tooltip" : { - "sort" : 1, + "value_type" : "individual", "shared" : false, - "value_type" : "individual" + "sort" : 1 }, - "datasource" : "Local", + "steppedLine" : true, "seriesOverrides" : [], - "timeShift" : null, "title" : "Health History - Last 3 days", - "pointradius" : 5, - "span" : 12, + "targets" : [ + { + "target" : "alias(maxSeries(summarize(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.health,\"5min\",\"max\")), 'Ceph Health')", + "textEditor" : true, + "refId" : "A" + } + ], + "hideTimeOverride" : true, "stack" : false, + "height" : "350", + "spaceLength" : 10, + "linewidth" : 2, + "timeFrom" : "3d", + "renderer" : "flot", + "timeShift" : null, + "type" : "graph", + "maxDataPoints" : "", "legend" : { - "values" : false, - "max" : false, - "min" : false, "total" : false, - "avg" : false, "current" : false, + "avg" : false, + "min" : false, + "values" : false, + "max" : false, "show" : true - }, - "dashes" : false, - "links" : [] + } } ], - "repeatIteration" : null, - "titleSize" : "h5" + "title" : "Cluster Health", + "showTitle" : true }, { + "collapse" : false, "repeatIteration" : null, + "titleSize" : "h5", "panels" : [ { "content" : "", - "links" : [], - "id" : 69, - "type" : "text", "transparent" : true, - "mode" : "html", - "span" : 1, "minSpan" : 1, - "title" : "" + "type" : "text", + "links" : [], + "span" : 1, + "title" : "", + "id" : 69, + "mode" : "html" }, { - "columns" : [ + "pageSize" : null, + "sort" : { + "desc" : false, + "col" : null + }, + "title" : "Monitor Status", + "span" : 3, + "targets" : [ { - "value" : "current", - "text" : "Current" + "target" : "aliasByNode(groupByNode(transformNull(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.mon_status.*),-1),-1,\"maxSeries\"),-1)", + "textEditor" : true, + "refId" : "B" } ], "id" : 56, + "columns" : [ + { + "text" : "Current", + "value" : "current" + } + ], + "showHeader" : true, + "scroll" : true, + "type" : "table", + "minSpan" : 2, "links" : [], - "sort" : { - "desc" : false, - "col" : null - }, + "transform" : "timeseries_aggregations", + "fontSize" : "100%", + "maxDataPoints" : "", + "hideTimeOverride" : true, + "timeFrom" : "1m", "styles" : [ { - "type" : "date", + "pattern" : "Time", "alias" : "Time", "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "pattern" : "Time" + "type" : "date" }, { - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "unit" : "short", - "pattern" : "Metric", "sanitize" : false, - "alias" : "Hostname", - "type" : "number", - "colorMode" : null, - "thresholds" : [], "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], - "decimals" : 2 + "pattern" : "Metric", + "type" : "number", + "thresholds" : [], + "unit" : "short", + "colorMode" : null, + "decimals" : 2, + "alias" : "Hostname", + "dateFormat" : "YYYY-MM-DD HH:mm:ss" }, { - "colors" : [ - "rgba(245, 54, 54, 0.9)", - "rgba(0, 169, 3, 0.89)", - "rgba(249, 190, 0, 0.97)" - ], - "decimals" : 0, - "type" : "number", - "alias" : "Status", - "colorMode" : "row", "thresholds" : [ "0", "3", "7" ], - "unit" : "short", + "type" : "number", + "alias" : "Status", "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "unit" : "short", + "colorMode" : "row", + "decimals" : 0, + "colors" : [ + "rgba(245, 54, 54, 0.9)", + "rgba(0, 169, 3, 0.89)", + "rgba(249, 190, 0, 0.97)" + ], "pattern" : "Current" }, { + "type" : "number", + "thresholds" : [], + "unit" : "short", + "decimals" : 2, + "colorMode" : null, + "alias" : "", "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], - "decimals" : 2, - "unit" : "short", - "pattern" : "/.*/", - "alias" : "", - "type" : "number", - "thresholds" : [], - "colorMode" : null - } - ], - "span" : 3, - "title" : "Monitor Status", - "timeShift" : null, - "minSpan" : 2, - "fontSize" : "100%", - "maxDataPoints" : "", - "hideTimeOverride" : true, - "type" : "table", - "transform" : "timeseries_aggregations", - "timeFrom" : "1m", - "pageSize" : null, - "showHeader" : true, - "targets" : [ - { - "refId" : "B", - "target" : "aliasByNode(groupByNode(transformNull(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.mon_status.*),-1),-1,\"maxSeries\"),-1)", - "textEditor" : true + "pattern" : "/.*/" } ], - "scroll" : true + "timeShift" : null }, { - "type" : "text", "content" : "", - "id" : 68, - "links" : [], - "mode" : "html", "transparent" : true, "minSpan" : 2, + "type" : "text", + "links" : [], + "span" : 2, "title" : "", - "span" : 2 + "id" : 68, + "mode" : "html" }, { - "span" : 1, - "minSpan" : 1, - "title" : "", - "id" : 58, - "links" : [], + "transparent" : true, "content" : "

Cluster Flags:

", + "minSpan" : 1, "type" : "text", + "id" : 58, "mode" : "html", - "transparent" : true + "links" : [], + "span" : 1, + "title" : "" }, { - "interval" : null, - "mappingType" : 1, - "height" : "95", + "gauge" : { + "show" : false, + "minValue" : 0, + "maxValue" : 100, + "thresholdLabels" : false, + "thresholdMarkers" : true + }, "mappingTypes" : [ { "name" : "value to text", @@ -531,15 +487,16 @@ "name" : "range to text" } ], - "colorValue" : false, - "nullPointMode" : "connected", + "height" : "95", + "postfixFontSize" : "50%", + "hideTimeOverride" : true, "timeFrom" : "1m", "prefixFontSize" : "50%", "valueMaps" : [ { + "text" : "N/A", "op" : "=", - "value" : "null", - "text" : "N/A" + "value" : "null" }, { "value" : "0", @@ -547,87 +504,104 @@ "op" : "=" }, { - "op" : "=", "value" : "1", + "op" : "=", "text" : "ACTIVE" }, { - "value" : "2", "text" : "DISABLED", - "op" : "=" - } + "op" : "=", + "value" : "2" + } ], - "tableColumn" : "", "type" : "singlestat", "maxDataPoints" : "", - "format" : "none", - "title" : "SCRUB", - "nullText" : null, - "span" : 1, - "gauge" : { - "show" : false, - "minValue" : 0, - "thresholdMarkers" : true, - "maxValue" : 100, - "thresholdLabels" : false - }, - "datasource" : "Local", "rangeMaps" : [ { - "to" : "null", + "text" : "N/A", "from" : "null", - "text" : "N/A" + "to" : "null" } ], - "links" : [], - "valueFontSize" : "40%", + "format" : "none", + "prefix" : "", + "cacheTimeout" : null, + "title" : "SCRUB", "targets" : [ { "refId" : "A", - "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.scrub),\"maxSeries\"))", - "textEditor" : true + "textEditor" : true, + "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.scrub),\"maxSeries\"))" } ], - "postfix" : "", - "postfixFontSize" : "50%", - "hideTimeOverride" : true, - "prefix" : "", + "description" : "Scrub activity takes place daily basis across the OSD's and performs object size and attribute checks. Scrub activity can be controlled with the \"ceph osd scrub\" command.", + "datasource" : "Local", + "colorValue" : false, "colorBackground" : true, + "valueName" : "current", + "nullText" : null, "minSpan" : 1, + "nullPointMode" : "connected", + "links" : [], + "postfix" : "", "colors" : [ "rgba(50, 172, 45, 0.97)", "rgba(237, 129, 40, 0.89)", "rgba(245, 54, 54, 0.9)" ], - "description" : "Scrub activity takes place daily basis across the OSD's and performs object size and attribute checks. Scrub activity can be controlled with the \"ceph osd scrub\" command.", + "mappingType" : 1, + "interval" : null, "thresholds" : "1,2", "sparkline" : { + "lineColor" : "rgb(31, 120, 193)", "fillColor" : "rgba(31, 118, 189, 0.18)", + "show" : false, + "full" : false + }, + "tableColumn" : "", + "id" : 57, + "span" : 1, + "valueFontSize" : "40%" + }, + { + "thresholds" : "1,2", + "tableColumn" : "", + "sparkline" : { "full" : false, + "fillColor" : "rgba(31, 118, 189, 0.18)", "show" : false, "lineColor" : "rgb(31, 120, 193)" }, + "id" : 59, + "valueFontSize" : "40%", + "span" : 1, + "colors" : [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "interval" : null, + "mappingType" : 1, + "nullText" : null, + "nullPointMode" : "connected", + "minSpan" : 1, + "links" : [], + "postfix" : "", + "description" : "Deep scrub acts on the objects within placement groups (PGs). Objects are read, and checksum's compared to protect against silent bit-rot events. Although a weekly activity, in large clusters is normal to see deep-scrub active on a daily basis. Scrub activity can be controlled with the \"ceph osd scrub\" command.", + "datasource" : "Local", + "colorBackground" : true, + "colorValue" : false, "valueName" : "current", + "prefix" : "", "cacheTimeout" : null, - "id" : 57 - }, - { - "format" : "none", - "maxDataPoints" : "", - "type" : "singlestat", - "mappingTypes" : [ - { - "value" : 1, - "name" : "value to text" - }, + "title" : "DEEP SCRUB", + "targets" : [ { - "value" : 2, - "name" : "range to text" + "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.deep_scrub),\"maxSeries\"))", + "textEditor" : true, + "refId" : "A" } ], - "timeFrom" : "1m", - "colorValue" : false, - "nullPointMode" : "connected", "valueMaps" : [ { "value" : "null", @@ -645,135 +619,120 @@ "op" : "=" }, { - "text" : "DISABLED", "value" : "2", - "op" : "=" + "op" : "=", + "text" : "DISABLED" } ], - "prefixFontSize" : "50%", - "tableColumn" : "", - "interval" : null, - "mappingType" : 1, - "height" : "95", + "type" : "singlestat", "rangeMaps" : [ { - "text" : "N/A", + "to" : "null", "from" : "null", - "to" : "null" + "text" : "N/A" + } + ], + "maxDataPoints" : "", + "format" : "none", + "height" : "95", + "mappingTypes" : [ + { + "name" : "value to text", + "value" : 1 + }, + { + "name" : "range to text", + "value" : 2 } ], - "links" : [], "gauge" : { + "maxValue" : 100, "show" : false, "minValue" : 0, "thresholdMarkers" : true, - "thresholdLabels" : false, - "maxValue" : 100 + "thresholdLabels" : false }, - "datasource" : "Local", - "title" : "DEEP SCRUB", - "nullText" : null, - "span" : 1, - "colorBackground" : true, - "prefix" : "", "postfixFontSize" : "50%", "hideTimeOverride" : true, - "postfix" : "", - "valueFontSize" : "40%", - "targets" : [ - { - "refId" : "A", - "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.deep_scrub),\"maxSeries\"))", - "textEditor" : true - } - ], - "sparkline" : { - "full" : false, - "fillColor" : "rgba(31, 118, 189, 0.18)", - "lineColor" : "rgb(31, 120, 193)", - "show" : false - }, - "thresholds" : "1,2", - "id" : 59, - "valueName" : "current", - "cacheTimeout" : null, - "description" : "Deep scrub acts on the objects within placement groups (PGs). Objects are read, and checksum's compared to protect against silent bit-rot events. Although a weekly activity, in large clusters is normal to see deep-scrub active on a daily basis. Scrub activity can be controlled with the \"ceph osd scrub\" command.", - "minSpan" : 1, - "colors" : [ - "rgba(50, 172, 45, 0.97)", - "rgba(237, 129, 40, 0.89)", - "rgba(245, 54, 54, 0.9)" - ] + "prefixFontSize" : "50%", + "timeFrom" : "1m" }, { - "description" : "With the recovery flag enabled, disruption in the cluster will result in data being recreated to freespace within the cluster to honor the pool's protection schema. Under some circumstances, you may use the norecover flag to prevent automatic recovery.", - "minSpan" : 1, "colors" : [ "rgba(50, 172, 45, 0.97)", "rgba(237, 129, 40, 0.89)", "rgba(245, 54, 54, 0.9)" ], + "mappingType" : 1, + "interval" : null, + "id" : 60, + "valueFontSize" : "40%", + "span" : 1, "thresholds" : "1,2", "sparkline" : { "lineColor" : "rgb(31, 120, 193)", "show" : false, - "full" : false, - "fillColor" : "rgba(31, 118, 189, 0.18)" + "fillColor" : "rgba(31, 118, 189, 0.18)", + "full" : false }, - "id" : 60, + "tableColumn" : "", "valueName" : "current", - "cacheTimeout" : null, + "datasource" : "Local", + "description" : "With the recovery flag enabled, disruption in the cluster will result in data being recreated to freespace within the cluster to honor the pool's protection schema. Under some circumstances, you may use the norecover flag to prevent automatic recovery.", + "colorValue" : false, + "colorBackground" : true, "postfix" : "", - "valueFontSize" : "40%", + "links" : [], + "nullText" : null, + "nullPointMode" : "connected", + "minSpan" : 1, + "cacheTimeout" : null, "targets" : [ { - "refId" : "A", "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.recovery),\"maxSeries\"))", - "textEditor" : true + "textEditor" : true, + "refId" : "A" } ], + "title" : "RECOVERY", "prefix" : "", - "colorBackground" : true, - "postfixFontSize" : "50%", - "hideTimeOverride" : true, + "timeFrom" : "1m", + "prefixFontSize" : "50%", "gauge" : { - "thresholdMarkers" : true, "minValue" : 0, "show" : false, - "thresholdLabels" : false, - "maxValue" : 100 + "maxValue" : 100, + "thresholdMarkers" : true, + "thresholdLabels" : false }, - "datasource" : "Local", - "title" : "RECOVERY", - "nullText" : null, - "span" : 1, - "rangeMaps" : [ - { - "text" : "N/A", - "from" : "null", - "to" : "null" - } - ], - "links" : [], "mappingTypes" : [ { "value" : 1, "name" : "value to text" }, { - "value" : 2, - "name" : "range to text" + "name" : "range to text", + "value" : 2 } ], - "nullPointMode" : "connected", - "colorValue" : false, - "timeFrom" : "1m", - "tableColumn" : "", + "height" : "95", + "postfixFontSize" : "50%", + "hideTimeOverride" : true, + "maxDataPoints" : "", + "rangeMaps" : [ + { + "to" : "null", + "from" : "null", + "text" : "N/A" + } + ], + "format" : "none", + "type" : "singlestat", "valueMaps" : [ { "value" : "null", - "text" : "N/A", - "op" : "=" + "op" : "=", + "text" : "N/A" }, { "op" : "=", @@ -781,128 +740,147 @@ "value" : "0" }, { - "value" : "1", + "op" : "=", "text" : "ACTIVE", - "op" : "=" + "value" : "1" }, { - "op" : "=", "value" : "2", + "op" : "=", "text" : "DISABLED" } - ], - "prefixFontSize" : "50%", - "interval" : null, - "mappingType" : 1, - "height" : "95", - "format" : "none", - "maxDataPoints" : "", - "type" : "singlestat" + ] }, { - "prefix" : "", - "colorBackground" : true, - "postfixFontSize" : "50%", - "hideTimeOverride" : true, - "postfix" : "", + "cacheTimeout" : null, "targets" : [ { + "refId" : "A", "textEditor" : true, - "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.backfill),\"maxSeries\"))", - "refId" : "A" + "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.backfill),\"maxSeries\"))" } ], - "valueFontSize" : "40%", - "thresholds" : "1,2", - "sparkline" : { - "show" : false, - "lineColor" : "rgb(31, 120, 193)", - "fillColor" : "rgba(31, 118, 189, 0.18)", - "full" : false - }, - "cacheTimeout" : null, - "valueName" : "current", - "id" : 64, - "minSpan" : 1, - "colors" : [ - "rgba(50, 172, 45, 0.97)", - "rgba(237, 129, 40, 0.89)", - "rgba(245, 54, 54, 0.9)" - ], - "format" : "none", + "title" : "BACKFILL", + "prefix" : "", "maxDataPoints" : "", - "type" : "singlestat", - "colorValue" : false, - "nullPointMode" : "connected", - "timeFrom" : "1m", - "mappingTypes" : [ - { - "name" : "value to text", - "value" : 1 - }, + "rangeMaps" : [ { - "name" : "range to text", - "value" : 2 + "to" : "null", + "from" : "null", + "text" : "N/A" } ], + "format" : "none", + "type" : "singlestat", "valueMaps" : [ { - "value" : "null", + "op" : "=", "text" : "N/A", - "op" : "=" + "value" : "null" }, { + "op" : "=", "text" : "ENABLED", - "value" : "0", - "op" : "=" + "value" : "0" }, { + "text" : "ACTIVE", "op" : "=", - "value" : "1", - "text" : "ACTIVE" + "value" : "1" }, { "value" : "2", - "text" : "DISABLED", - "op" : "=" + "op" : "=", + "text" : "DISABLED" } ], + "timeFrom" : "1m", "prefixFontSize" : "50%", + "gauge" : { + "thresholdMarkers" : true, + "thresholdLabels" : false, + "minValue" : 0, + "show" : false, + "maxValue" : 100 + }, + "height" : "95", + "mappingTypes" : [ + { + "value" : 1, + "name" : "value to text" + }, + { + "name" : "range to text", + "value" : 2 + } + ], + "postfixFontSize" : "50%", + "hideTimeOverride" : true, + "id" : 64, + "span" : 1, + "valueFontSize" : "40%", + "thresholds" : "1,2", + "sparkline" : { + "lineColor" : "rgb(31, 120, 193)", + "show" : false, + "fillColor" : "rgba(31, 118, 189, 0.18)", + "full" : false + }, "tableColumn" : "", + "colors" : [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], "mappingType" : 1, - "height" : "95", "interval" : null, + "postfix" : "", "links" : [], - "rangeMaps" : [ + "nullText" : null, + "nullPointMode" : "connected", + "minSpan" : 1, + "valueName" : "current", + "datasource" : "Local", + "colorValue" : false, + "colorBackground" : true + }, + { + "prefix" : "", + "targets" : [ { - "text" : "N/A", - "from" : "null", - "to" : "null" + "refId" : "A", + "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.rebalance),\"maxSeries\"))", + "textEditor" : true } ], + "title" : "REBALANCE", + "cacheTimeout" : null, + "postfixFontSize" : "50%", + "hideTimeOverride" : true, "gauge" : { "minValue" : 0, "show" : false, + "maxValue" : 100, "thresholdMarkers" : true, - "thresholdLabels" : false, - "maxValue" : 100 + "thresholdLabels" : false }, - "datasource" : "Local", - "nullText" : null, - "title" : "BACKFILL", - "span" : 1 - }, - { - "type" : "singlestat", - "maxDataPoints" : "", - "format" : "none", - "interval" : null, - "mappingType" : 1, "height" : "95", + "mappingTypes" : [ + { + "name" : "value to text", + "value" : 1 + }, + { + "value" : 2, + "name" : "range to text" + } + ], + "timeFrom" : "1m", + "prefixFontSize" : "50%", "valueMaps" : [ { - "op" : "=", "value" : "null", + "op" : "=", "text" : "N/A" }, { @@ -916,174 +894,148 @@ "value" : "1" }, { - "value" : "2", "text" : "DISABLED", - "op" : "=" - } - ], - "prefixFontSize" : "50%", - "tableColumn" : "", - "mappingTypes" : [ - { - "name" : "value to text", - "value" : 1 - }, - { - "name" : "range to text", - "value" : 2 + "op" : "=", + "value" : "2" } ], - "nullPointMode" : "connected", - "colorValue" : false, - "timeFrom" : "1m", + "type" : "singlestat", + "format" : "none", + "maxDataPoints" : "", "rangeMaps" : [ { + "text" : "N/A", "from" : "null", - "to" : "null", - "text" : "N/A" - } - ], - "links" : [], - "span" : 1, - "title" : "REBALANCE", - "nullText" : null, - "datasource" : "Local", - "gauge" : { - "thresholdMarkers" : true, - "minValue" : 0, - "show" : false, - "thresholdLabels" : false, - "maxValue" : 100 - }, - "hideTimeOverride" : true, - "postfixFontSize" : "50%", - "prefix" : "", - "colorBackground" : true, - "valueFontSize" : "40%", - "targets" : [ - { - "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.rebalance),\"maxSeries\"))", - "textEditor" : true, - "refId" : "A" + "to" : "null" } ], - "postfix" : "", - "id" : 61, - "valueName" : "current", - "cacheTimeout" : null, - "sparkline" : { - "lineColor" : "rgb(31, 120, 193)", - "show" : false, - "fillColor" : "rgba(31, 118, 189, 0.18)", - "full" : false - }, - "thresholds" : "1,2", + "mappingType" : 1, + "interval" : null, "colors" : [ "rgba(50, 172, 45, 0.97)", "rgba(237, 129, 40, 0.89)", "rgba(245, 54, 54, 0.9)" ], - "minSpan" : 1 - }, - { - "valueName" : "current", - "id" : 62, - "cacheTimeout" : null, - "thresholds" : "1,2", "sparkline" : { - "lineColor" : "rgb(31, 120, 193)", "show" : false, "fillColor" : "rgba(31, 118, 189, 0.18)", - "full" : false + "full" : false, + "lineColor" : "rgb(31, 120, 193)" }, - "colors" : [ - "rgba(50, 172, 45, 0.97)", - "rgba(237, 129, 40, 0.89)", - "rgba(245, 54, 54, 0.9)" - ], + "tableColumn" : "", + "thresholds" : "1,2", + "valueFontSize" : "40%", + "span" : 1, + "id" : 61, + "colorValue" : false, + "colorBackground" : true, + "datasource" : "Local", + "valueName" : "current", "minSpan" : 1, - "description" : "The OUT flag setting allows the mon's to mark OSD's as out of the configuration when they stop sending hearbeats to the mon's. By marking them OUT, recovery takes place. However, for planned maintenance you can set the cluster to noout to disable this behavior.", - "hideTimeOverride" : true, + "nullPointMode" : "connected", + "nullText" : null, + "links" : [], + "postfix" : "" + }, + { + "prefixFontSize" : "50%", + "timeFrom" : "1m", + "timeShift" : null, "postfixFontSize" : "50%", - "colorBackground" : true, - "prefix" : "", - "valueFontSize" : "40%", - "targets" : [ + "hideTimeOverride" : true, + "height" : "95", + "mappingTypes" : [ { - "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.out),\"maxSeries\"))", - "textEditor" : true, - "refId" : "A" - } - ], - "postfix" : "", - "rangeMaps" : [ + "name" : "value to text", + "value" : 1 + }, { - "to" : "null", - "from" : "null", - "text" : "N/A" + "value" : 2, + "name" : "range to text" } ], - "links" : [], - "span" : 1, - "title" : "OUT", - "timeShift" : null, - "nullText" : null, - "datasource" : "Local", "gauge" : { - "maxValue" : 100, - "thresholdLabels" : false, "thresholdMarkers" : true, + "thresholdLabels" : false, + "maxValue" : 100, "minValue" : 0, "show" : false }, - "type" : "singlestat", - "maxDataPoints" : "", "format" : "none", - "interval" : null, - "height" : "95", - "mappingType" : 1, + "rangeMaps" : [ + { + "to" : "null", + "text" : "N/A", + "from" : "null" + } + ], + "maxDataPoints" : "", + "type" : "singlestat", "valueMaps" : [ { "text" : "N/A", - "value" : "null", - "op" : "=" + "op" : "=", + "value" : "null" }, { "text" : "ENABLED", - "value" : "0", - "op" : "=" + "op" : "=", + "value" : "0" }, { - "op" : "=", "value" : "1", - "text" : "ACTIVE" + "text" : "ACTIVE", + "op" : "=" }, { - "value" : "2", "text" : "DISABLED", - "op" : "=" + "op" : "=", + "value" : "2" }, { - "op" : "=", "value" : "-1", - "text" : "NODATA" + "text" : "NODATA", + "op" : "=" } ], - "tableColumn" : "", - "prefixFontSize" : "50%", - "mappingTypes" : [ - { - "value" : 1, - "name" : "value to text" - }, + "title" : "OUT", + "targets" : [ { - "name" : "range to text", - "value" : 2 + "refId" : "A", + "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.out),\"maxSeries\"))", + "textEditor" : true } ], - "nullPointMode" : "connected", + "cacheTimeout" : null, + "prefix" : "", + "valueName" : "current", + "colorBackground" : true, "colorValue" : false, - "timeFrom" : "1m" + "description" : "The OUT flag setting allows the mon's to mark OSD's as out of the configuration when they stop sending hearbeats to the mon's. By marking them OUT, recovery takes place. However, for planned maintenance you can set the cluster to noout to disable this behavior.", + "datasource" : "Local", + "postfix" : "", + "links" : [], + "nullPointMode" : "connected", + "minSpan" : 1, + "nullText" : null, + "interval" : null, + "mappingType" : 1, + "colors" : [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "span" : 1, + "valueFontSize" : "40%", + "id" : 62, + "tableColumn" : "", + "sparkline" : { + "lineColor" : "rgb(31, 120, 193)", + "full" : false, + "show" : false, + "fillColor" : "rgba(31, 118, 189, 0.18)" + }, + "thresholds" : "1,2" }, { "sparkline" : { @@ -1092,67 +1044,38 @@ "show" : false, "lineColor" : "rgb(31, 120, 193)" }, + "tableColumn" : "", "thresholds" : "1,2", - "valueName" : "current", + "span" : 1, + "valueFontSize" : "40%", "id" : 63, - "cacheTimeout" : null, - "description" : "The down feature allows OSD's to mark their peers as DOWN when they are not reachable. However, if there is a poor network or planned outages, you may want to set this flag to nodown to prevent OSD's flapping between up/down states", - "minSpan" : 1, + "mappingType" : 1, + "interval" : null, "colors" : [ "rgba(50, 172, 45, 0.97)", "rgba(237, 129, 40, 0.89)", "rgba(245, 54, 54, 0.9)" ], - "prefix" : "", - "colorBackground" : true, - "postfixFontSize" : "50%", - "hideTimeOverride" : true, + "minSpan" : 1, + "nullPointMode" : "connected", + "nullText" : null, "postfix" : "", + "links" : [], + "colorValue" : false, + "colorBackground" : true, + "description" : "The down feature allows OSD's to mark their peers as DOWN when they are not reachable. However, if there is a poor network or planned outages, you may want to set this flag to nodown to prevent OSD's flapping between up/down states", + "datasource" : "Local", + "valueName" : "current", + "prefix" : "", "targets" : [ { "refId" : "A", - "textEditor" : true, - "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.down),\"maxSeries\"))" - } - ], - "valueFontSize" : "40%", - "links" : [], - "rangeMaps" : [ - { - "text" : "N/A", - "from" : "null", - "to" : "null" + "target" : "maxSeries(consolidateBy(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.features.down),\"maxSeries\"))", + "textEditor" : true } ], - "gauge" : { - "thresholdMarkers" : true, - "minValue" : 0, - "show" : false, - "maxValue" : 100, - "thresholdLabels" : false - }, - "datasource" : "Local", - "nullText" : null, - "timeShift" : null, "title" : "DOWN", - "span" : 1, - "format" : "none", - "maxDataPoints" : "", - "type" : "singlestat", - "nullPointMode" : "connected", - "colorValue" : false, - "timeFrom" : "1m", - "mappingTypes" : [ - { - "value" : 1, - "name" : "value to text" - }, - { - "name" : "range to text", - "value" : 2 - } - ], - "tableColumn" : "", + "cacheTimeout" : null, "valueMaps" : [ { "value" : "null", @@ -1160,368 +1083,325 @@ "op" : "=" }, { - "op" : "=", "value" : "0", - "text" : "ENABLED" + "text" : "ENABLED", + "op" : "=" }, { "value" : "1", - "text" : "ACTIVE", - "op" : "=" + "op" : "=", + "text" : "ACTIVE" }, { - "op" : "=", "text" : "DISABLED", + "op" : "=", "value" : "2" } ], - "prefixFontSize" : "50%", + "type" : "singlestat", + "format" : "none", + "maxDataPoints" : "", + "rangeMaps" : [ + { + "from" : "null", + "text" : "N/A", + "to" : "null" + } + ], + "postfixFontSize" : "50%", + "hideTimeOverride" : true, + "gauge" : { + "thresholdLabels" : false, + "thresholdMarkers" : true, + "maxValue" : 100, + "minValue" : 0, + "show" : false + }, "height" : "95", - "mappingType" : 1, - "interval" : null + "mappingTypes" : [ + { + "name" : "value to text", + "value" : 1 + }, + { + "value" : 2, + "name" : "range to text" + } + ], + "timeFrom" : "1m", + "prefixFontSize" : "50%", + "timeShift" : null } ], - "showTitle" : true, - "titleSize" : "h5", - "repeat" : null, + "repeatRowId" : null, "title" : "Cluster State", - "collapse" : false, + "showTitle" : true, "height" : "200", - "repeatRowId" : null + "repeat" : null }, { - "titleSize" : "h5", - "repeatIteration" : null, + "repeat" : null, + "height" : 250, + "collapse" : false, "showTitle" : true, + "title" : "Storage Information", + "repeatRowId" : null, "panels" : [ { - "transform" : "timeseries_aggregations", - "title" : "Disks Near Full", "scroll" : true, - "minSpan" : 1, - "pageSize" : null, "showHeader" : true, - "targets" : [ - { - "textEditor" : true, - "target" : "aliasByNode(currentAbove(transformNull(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.*.osd_percent_used),0),$disk_full_threshold),1,-2)", - "refId" : "A" - } - ], - "span" : 1, - "fontSize" : "100%", - "columns" : [ - { - "value" : "current", - "text" : "Current" - } - ], - "sort" : { - "desc" : true, - "col" : 0 - }, - "type" : "table", "styles" : [ { - "type" : "date", + "pattern" : "Time", "alias" : "Time", "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "pattern" : "Time" + "type" : "date" }, { - "colorMode" : null, + "colors" : [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "pattern" : "Current", "thresholds" : [], "type" : "hidden", "alias" : "% Full", - "unit" : "none", "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "pattern" : "Current", + "unit" : "none", + "decimals" : 0, + "colorMode" : null + }, + { "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], - "decimals" : 0 - }, - { - "alias" : "Host.OSD Id", - "type" : "number", - "colorMode" : null, - "thresholds" : [], "pattern" : "Metric", "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "alias" : "Host.OSD Id", "unit" : "short", "decimals" : 2, - "colors" : [ - "rgba(245, 54, 54, 0.9)", - "rgba(237, 129, 40, 0.89)", - "rgba(50, 172, 45, 0.97)" - ] + "colorMode" : null, + "thresholds" : [], + "type" : "number" }, { + "pattern" : "/.*/", "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], - "decimals" : 2, - "unit" : "short", - "pattern" : "/.*/", - "type" : "number", "alias" : "", "colorMode" : null, - "thresholds" : [] + "decimals" : 2, + "unit" : "short", + "thresholds" : [], + "type" : "number" } ], + "columns" : [ + { + "value" : "current", + "text" : "Current" + } + ], + "transform" : "timeseries_aggregations", "id" : 75, - "links" : [] + "fontSize" : "100%", + "title" : "Disks Near Full", + "span" : 1, + "targets" : [ + { + "refId" : "A", + "textEditor" : true, + "target" : "aliasByNode(currentAbove(transformNull(keepLastValue(collectd.*.$domain.cephmetrics.gauge.$cluster_name.osd.*.osd_percent_used),0),$disk_full_threshold),1,-2)" + } + ], + "links" : [], + "sort" : { + "desc" : true, + "col" : 0 + }, + "type" : "table", + "pageSize" : null, + "minSpan" : 1 }, { - "type" : "table", - "hideTimeOverride" : true, - "fontSize" : "100%", "scroll" : true, + "showHeader" : true, + "columns" : [ + { + "text" : "Current", + "value" : "current" + } + ], + "id" : 71, + "title" : "OSD's Down", + "span" : 1, "targets" : [ { - "hide" : false, + "target" : "currentBelow(groupByNode(transformNull(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.osd_state.*.up,99),-2,\"maxSeries\"),0.5)", + "textEditor" : true, "refId" : "B", - "target" : "currentBelow(groupByNode(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.osd_state.*.up,-2,\"maxSeries\"),0.5)", - "textEditor" : true + "hide" : false } ], + "sort" : { + "col" : null, + "desc" : false + }, "pageSize" : 100, - "showHeader" : true, - "timeFrom" : "1m", - "transform" : "timeseries_aggregations", + "timeShift" : null, "styles" : [ { - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "unit" : "short", - "pattern" : "Metric", - "sanitize" : false, - "alias" : "OSD Id", "type" : "number", - "colorMode" : null, "thresholds" : [ "" ], + "decimals" : 0, + "colorMode" : null, + "unit" : "short", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "alias" : "OSD Id", + "sanitize" : false, + "pattern" : "Metric", "colors" : [ "rgba(50, 172, 45, 0.97)", "rgba(237, 129, 40, 0.89)", "rgba(245, 54, 54, 0.9)" - ], - "decimals" : 0 + ] }, { - "alias" : "Status", - "type" : "hidden", - "colorMode" : "cell", - "thresholds" : [ - "0" - ], "pattern" : "Current", - "unit" : "short", - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "decimals" : 0, "colors" : [ "rgba(50, 172, 45, 0.97)", "rgba(237, 129, 40, 0.89)", "rgba(245, 54, 54, 0.9)" - ] + ], + "thresholds" : [ + "0" + ], + "type" : "hidden", + "alias" : "Status", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "colorMode" : "cell", + "decimals" : 0, + "unit" : "short" } ], - "sort" : { - "col" : null, - "desc" : false - }, - "id" : 71, + "timeFrom" : "1m", + "hideTimeOverride" : true, + "fontSize" : "100%", + "transform" : "timeseries_aggregations", "links" : [], - "columns" : [ - { - "text" : "Current", - "value" : "current" - } - ], - "title" : "OSD's Down", - "timeShift" : null, "minSpan" : 1, - "span" : 1 + "type" : "table" }, { - "hideTimeOverride" : true, - "type" : "table", "fontSize" : "100%", - "pageSize" : null, - "showHeader" : true, - "targets" : [ - { - "textEditor" : true, - "target" : "currentBelow(groupByNode(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.osd_state.*.in,-2,\"minSeries\"),0.5)", - "refId" : "B", - "hide" : false - } - ], - "scroll" : true, "transform" : "timeseries_aggregations", - "timeFrom" : "5m", - "id" : 74, "links" : [], - "sort" : { - "col" : 0, - "desc" : true - }, + "minSpan" : 1, + "type" : "table", + "timeShift" : null, "styles" : [ { - "dateFormat" : "YYYY-MM-DD HH:mm:ss", "pattern" : "Time", "alias" : "Time", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", "type" : "date" }, { - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "unit" : "none", "pattern" : "Current", - "alias" : "", - "type" : "hidden", - "thresholds" : [], - "colorMode" : null, "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], - "decimals" : 0 + "colorMode" : null, + "decimals" : 0, + "unit" : "none", + "alias" : "", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "type" : "hidden", + "thresholds" : [] }, { "type" : "number", - "alias" : "OSD Id", "thresholds" : [], + "unit" : "short", + "decimals" : 2, "colorMode" : null, + "alias" : "OSD Id", "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "unit" : "short", - "pattern" : "Metric", "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" ], - "decimals" : 2 + "pattern" : "Metric" }, { - "pattern" : "/.*/", - "unit" : "short", - "colorMode" : null, - "thresholds" : [], - "type" : "number", - "alias" : "", - "decimals" : 2, "colors" : [ "rgba(245, 54, 54, 0.9)", "rgba(237, 129, 40, 0.89)", "rgba(50, 172, 45, 0.97)" - ] + ], + "pattern" : "/.*/", + "thresholds" : [], + "type" : "number", + "alias" : "", + "unit" : "short", + "colorMode" : null, + "decimals" : 2 } ], - "columns" : [ + "timeFrom" : "5m", + "hideTimeOverride" : true, + "id" : 74, + "title" : "OSDs Out", + "targets" : [ { - "text" : "Current", - "value" : "current" + "hide" : false, + "refId" : "B", + "target" : "currentBelow(groupByNode(transformNull(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.osd_state.*.in,99),-2,\"minSeries\"),0.5)", + "textEditor" : true } ], "span" : 1, - "timeShift" : null, - "title" : "OSDs Out", - "minSpan" : 1 + "sort" : { + "desc" : true, + "col" : 0 + }, + "pageSize" : null, + "scroll" : true, + "showHeader" : true, + "columns" : [ + { + "value" : "current", + "text" : "Current" + } + ] }, { - "title" : "", "minSpan" : 1, - "span" : 1, - "transparent" : true, - "mode" : "html", "type" : "text", "links" : [], + "title" : "", + "span" : 1, "id" : 73, - "content" : "" + "mode" : "html", + "content" : "", + "transparent" : true }, { - "columns" : [ - { - "value" : "current", - "text" : "Current" - } - ], - "links" : [], - "id" : 10, - "styles" : [ - { - "pattern" : "Time", - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "type" : "date" - }, - { - "decimals" : 2, - "colors" : [ - "rgba(245, 54, 54, 0.9)", - "rgba(237, 129, 40, 0.89)", - "rgba(50, 172, 45, 0.97)" - ], - "pattern" : "Metric", - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "unit" : "short", - "type" : "number", - "alias" : "Object State", - "colorMode" : null, - "thresholds" : [] - }, - { - "pattern" : "Current", - "unit" : "none", - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "thresholds" : [], - "colorMode" : null, - "type" : "number", - "alias" : "Count", - "decimals" : 0, - "colors" : [ - "rgba(245, 54, 54, 0.9)", - "rgba(237, 129, 40, 0.89)", - "rgba(50, 172, 45, 0.97)" - ] - }, - { - "pattern" : "/.*/", - "unit" : "none", - "colorMode" : null, - "thresholds" : [], - "type" : "number", - "decimals" : 0, - "colors" : [ - "rgba(245, 54, 54, 0.9)", - "rgba(237, 129, 40, 0.89)", - "rgba(50, 172, 45, 0.97)" - ] - } - ], - "sort" : { - "col" : null, - "desc" : false - }, - "datasource" : "Local", - "span" : 4, - "filterNull" : false, "title" : "Object Summary", - "minSpan" : 3, - "fontSize" : "100%", - "type" : "table", - "transform" : "timeseries_aggregations", + "span" : 4, "targets" : [ { - "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_object), 'Total Objects')", - "dsType" : "influxdb", - "tags" : [], - "alias" : "Objects", - "refId" : "A", "select" : [ [ { @@ -1536,31 +1416,8 @@ } ] ], - "textEditor" : true, - "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_object", - "policy" : "default", - "groupBy" : [ - { - "type" : "time", - "params" : [ - "$__interval" - ] - }, - { - "type" : "fill", - "params" : [ - "null" - ] - } - ], - "resultFormat" : "time_series" - }, - { - "refId" : "B", - "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_object_degraded), 'Objects degraded')", - "dsType" : "influxdb", - "tags" : [], - "alias" : "Objects", + "textEditor" : true, + "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_object), 'Total Objects')", "groupBy" : [ { "params" : [ @@ -1575,7 +1432,18 @@ "type" : "fill" } ], + "policy" : "default", + "dsType" : "influxdb", + "refId" : "A", + "alias" : "Objects", + "tags" : [], + "resultFormat" : "time_series", + "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_object" + }, + { + "tags" : [], "resultFormat" : "time_series", + "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_object", "select" : [ [ { @@ -1591,17 +1459,49 @@ ] ], "textEditor" : true, - "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_object", - "policy" : "default" + "dsType" : "influxdb", + "groupBy" : [ + { + "params" : [ + "$__interval" + ], + "type" : "time" + }, + { + "params" : [ + "null" + ], + "type" : "fill" + } + ], + "policy" : "default", + "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_object_degraded), 'Objects degraded')", + "refId" : "B", + "alias" : "Objects" }, { - "dsType" : "influxdb", - "alias" : "Objects", + "resultFormat" : "time_series", + "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_object", "tags" : [], - "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_object_misplaced), 'Objects misplaced')", "refId" : "C", - "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_object", + "alias" : "Objects", + "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_object_misplaced), 'Objects misplaced')", "policy" : "default", + "dsType" : "influxdb", + "groupBy" : [ + { + "params" : [ + "$__interval" + ], + "type" : "time" + }, + { + "params" : [ + "null" + ], + "type" : "fill" + } + ], "select" : [ [ { @@ -1616,7 +1516,11 @@ } ] ], - "textEditor" : true, + "textEditor" : true + }, + { + "alias" : "Objects", + "refId" : "D", "groupBy" : [ { "type" : "time", @@ -1631,9 +1535,10 @@ "type" : "fill" } ], - "resultFormat" : "time_series" - }, - { + "policy" : "default", + "dsType" : "influxdb", + "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_object_unfound), 'Objects unfound')", + "textEditor" : true, "select" : [ [ { @@ -1648,104 +1553,172 @@ } ] ], - "textEditor" : true, - "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_object", - "policy" : "default", - "groupBy" : [ - { - "params" : [ - "$__interval" - ], - "type" : "time" - }, - { - "params" : [ - "null" - ], - "type" : "fill" - } - ], "resultFormat" : "time_series", - "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_object_unfound), 'Objects unfound')", - "dsType" : "influxdb", - "alias" : "Objects", - "tags" : [], - "refId" : "D" + "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_object", + "tags" : [] } ], + "id" : 10, "pageSize" : null, + "sort" : { + "desc" : false, + "col" : null + }, "showHeader" : true, - "scroll" : true + "scroll" : true, + "columns" : [ + { + "text" : "Current", + "value" : "current" + } + ], + "filterNull" : false, + "links" : [], + "transform" : "timeseries_aggregations", + "fontSize" : "100%", + "type" : "table", + "minSpan" : 3, + "styles" : [ + { + "type" : "date", + "pattern" : "Time", + "dateFormat" : "YYYY-MM-DD HH:mm:ss" + }, + { + "thresholds" : [], + "type" : "number", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "alias" : "Object State", + "unit" : "short", + "decimals" : 2, + "colorMode" : null, + "colors" : [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "pattern" : "Metric" + }, + { + "type" : "number", + "thresholds" : [], + "unit" : "none", + "decimals" : 0, + "colorMode" : null, + "alias" : "Count", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "colors" : [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "pattern" : "Current" + }, + { + "thresholds" : [], + "type" : "number", + "pattern" : "/.*/", + "colors" : [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "colorMode" : null, + "decimals" : 0, + "unit" : "none" + } + ], + "datasource" : "Local" }, { + "minSpan" : 1, "type" : "text", - "content" : "", "links" : [], + "span" : 1, + "title" : "", "id" : 67, "mode" : "markdown", - "transparent" : true, - "minSpan" : 1, - "title" : "", - "span" : 1 + "content" : "", + "transparent" : true }, { - "showHeader" : true, - "pageSize" : null, - "targets" : [ + "minSpan" : 3, + "type" : "table", + "fontSize" : "100%", + "transform" : "timeseries_aggregations", + "links" : [], + "datasource" : "Local", + "styles" : [ { - "refId" : "A", - "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_pg), 'PGs')", - "dsType" : "influxdb", - "alias" : "PG's", - "tags" : [], - "groupBy" : [ - { - "params" : [ - "$__interval" - ], - "type" : "time" - }, - { - "type" : "fill", - "params" : [ - "null" - ] - } - ], - "resultFormat" : "time_series", - "select" : [ - [ - { - "params" : [ - "value" - ], - "type" : "field" - }, - { - "params" : [], - "type" : "mean" - } - ] + "pattern" : "Time", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "type" : "date" + }, + { + "decimals" : 2, + "colorMode" : null, + "unit" : "short", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "alias" : "PG State", + "type" : "number", + "thresholds" : [], + "pattern" : "Metric", + "colors" : [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ] + }, + { + "colors" : [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" ], - "textEditor" : true, - "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_pg", - "policy" : "default" + "pattern" : "Current", + "alias" : "Count", + "dateFormat" : "YYYY-MM-DD HH:mm:ss", + "unit" : "none", + "decimals" : 0, + "colorMode" : null, + "thresholds" : [], + "type" : "number" }, { - "dsType" : "influxdb", - "alias" : "PG's", + "thresholds" : [], + "type" : "number", + "colors" : [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "pattern" : "/.*/", + "unit" : "none", + "colorMode" : null, + "decimals" : 0 + } + ], + "sort" : { + "desc" : false, + "col" : null + }, + "pageSize" : null, + "id" : 13, + "span" : 3, + "title" : "PG Summary", + "targets" : [ + { "tags" : [], - "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_pg_active), 'Active PGs')", - "refId" : "B", "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_pg", - "policy" : "default", + "resultFormat" : "time_series", + "textEditor" : true, "select" : [ [ { - "type" : "field", "params" : [ "value" - ] + ], + "type" : "field" }, { "params" : [], @@ -1753,7 +1726,8 @@ } ] ], - "textEditor" : true, + "dsType" : "influxdb", + "policy" : "default", "groupBy" : [ { "type" : "time", @@ -1768,9 +1742,14 @@ "type" : "fill" } ], - "resultFormat" : "time_series" + "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_pg), 'PGs')", + "refId" : "A", + "alias" : "PG's" }, { + "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_pg_active), 'Active PGs')", + "policy" : "default", + "dsType" : "influxdb", "groupBy" : [ { "type" : "time", @@ -1779,15 +1758,13 @@ ] }, { + "type" : "fill", "params" : [ "null" - ], - "type" : "fill" + ] } ], - "resultFormat" : "time_series", - "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_pg", - "policy" : "default", + "textEditor" : true, "select" : [ [ { @@ -1797,37 +1774,39 @@ "type" : "field" }, { - "type" : "mean", - "params" : [] + "params" : [], + "type" : "mean" } ] ], - "textEditor" : true, - "refId" : "C", - "dsType" : "influxdb", + "refId" : "B", "alias" : "PG's", "tags" : [], - "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_pg_active_clean), 'Active+clean PGs')" + "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_pg", + "resultFormat" : "time_series" }, { - "policy" : "default", + "tags" : [], + "resultFormat" : "time_series", "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_pg", - "textEditor" : true, "select" : [ [ { - "type" : "field", "params" : [ "value" - ] + ], + "type" : "field" }, { - "type" : "mean", - "params" : [] + "params" : [], + "type" : "mean" } ] ], - "resultFormat" : "time_series", + "textEditor" : true, + "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_pg_active_clean), 'Active+clean PGs')", + "dsType" : "influxdb", + "policy" : "default", "groupBy" : [ { "params" : [ @@ -1842,113 +1821,67 @@ ] } ], - "alias" : "PG's", - "tags" : [], - "dsType" : "influxdb", - "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_pg_peering), 'PGs peering')", - "refId" : "D" - } - ], - "scroll" : true, - "transform" : "timeseries_aggregations", - "type" : "table", - "fontSize" : "100%", - "filterNull" : false, - "span" : 3, - "title" : "PG Summary", - "minSpan" : 3, - "datasource" : "Local", - "id" : 13, - "links" : [], - "sort" : { - "desc" : false, - "col" : null - }, - "styles" : [ - { - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "pattern" : "Time", - "type" : "date" + "refId" : "C", + "alias" : "PG's" }, { - "colors" : [ - "rgba(245, 54, 54, 0.9)", - "rgba(237, 129, 40, 0.89)", - "rgba(50, 172, 45, 0.97)" + "resultFormat" : "time_series", + "measurement" : "collectd.obj-mon-1.storage.lab.cephmetrics.gauge.ceph.mon.num_pg", + "tags" : [], + "alias" : "PG's", + "refId" : "D", + "textEditor" : true, + "select" : [ + [ + { + "type" : "field", + "params" : [ + "value" + ] + }, + { + "params" : [], + "type" : "mean" + } + ] ], - "decimals" : 2, - "thresholds" : [], - "colorMode" : null, - "type" : "number", - "alias" : "PG State", - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "unit" : "short", - "pattern" : "Metric" - }, - { - "colorMode" : null, - "thresholds" : [], - "type" : "number", - "alias" : "Count", - "pattern" : "Current", - "unit" : "none", - "dateFormat" : "YYYY-MM-DD HH:mm:ss", - "decimals" : 0, - "colors" : [ - "rgba(245, 54, 54, 0.9)", - "rgba(237, 129, 40, 0.89)", - "rgba(50, 172, 45, 0.97)" - ] - }, - { - "decimals" : 0, - "type" : "number", - "thresholds" : [], - "colorMode" : null, - "colors" : [ - "rgba(245, 54, 54, 0.9)", - "rgba(237, 129, 40, 0.89)", - "rgba(50, 172, 45, 0.97)" + "groupBy" : [ + { + "type" : "time", + "params" : [ + "$__interval" + ] + }, + { + "params" : [ + "null" + ], + "type" : "fill" + } ], - "pattern" : "/.*/", - "unit" : "none" + "dsType" : "influxdb", + "policy" : "default", + "target" : "alias(maxSeries(collectd.*.$domain.cephmetrics.gauge.$cluster_name.mon.num_pg_peering), 'PGs peering')" } ], + "filterNull" : false, "columns" : [ { - "text" : "Current", - "value" : "current" + "value" : "current", + "text" : "Current" } - ] + ], + "scroll" : true, + "showHeader" : true } ], - "title" : "Storage Information", - "collapse" : true, - "repeatRowId" : null, - "height" : 250, - "repeat" : null + "titleSize" : "h5", + "repeatIteration" : null } ], "hideControls" : true, - "timezone" : "browser", - "refresh" : "10s", "title" : "Ceph Health", - "schemaVersion" : 14, - "graphTooltip" : 0, - "version" : 41, - "editable" : false, "timepicker" : { - "time_options" : [ - "5m", - "15m", - "1h", - "6h", - "12h", - "24h", - "2d", - "7d", - "30d" - ], "refresh_intervals" : [ "5s", "10s", @@ -1960,20 +1893,87 @@ "1h", "2h", "1d" + ], + "time_options" : [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "id" : 29, + "annotations" : { + "list" : [ + { + "type" : "alert", + "iconColor" : "rgba(255, 96, 96, 1)", + "showIn" : 0, + "enable" : true, + "datasource" : "Local", + "tags" : "health_alert", + "name" : "health_alert", + "limit" : 100, + "hide" : false + }, + { + "datasource" : "Local", + "tags" : "health_ok", + "enable" : true, + "name" : "health_ok", + "limit" : 100, + "hide" : false, + "type" : "alert", + "iconColor" : "rgb(1, 195, 0)", + "showIn" : 0 + } ] - } + }, + "schemaVersion" : 14, + "timezone" : "browser", + "graphTooltip" : 0, + "refresh" : "10s", + "version" : 43, + "editable" : false, + "links" : [ + { + "keepTime" : true, + "tags" : [ + "overview" + ], + "includeVars" : true, + "asDropdown" : true, + "targetBlank" : true, + "icon" : "external link", + "title" : "Shortcuts", + "type" : "dashboards" + } + ], + "style" : "dark", + "time" : { + "to" : "now", + "from" : "now-1h" + }, + "gnetId" : null, + "tags" : [ + "overview" + ] }, "meta" : { - "canEdit" : true, - "canSave" : true, - "slug" : "ceph-health", "updatedBy" : "admin", - "canStar" : true, + "canEdit" : true, "createdBy" : "admin", "type" : "db", - "updated" : "2017-08-19T21:14:18Z", + "canSave" : true, + "updated" : "2017-08-21T03:34:51Z", "expires" : "0001-01-01T00:00:00Z", + "canStar" : true, + "version" : 43, "created" : "2017-08-08T03:07:37Z", - "version" : 41 + "slug" : "ceph-health" } }