# Patch summary. This is free-form text placed ahead of the first "diff --git"
# header; it is not part of any hunk.
#   * grafana/templates/configmap-dashboards.yaml (new file): renders a
#     "grafana-dashboards" ConfigMap holding one "<key>.json" entry per item in
#     .Values.conf.dashboards, gated by .Values.manifests.configmap_dashboards.
#   * grafana/templates/configmap-etc.yaml: no longer emits the base64-encoded
#     "<key>.json" dashboard entries.
#   * grafana/templates/deployment.yaml: the per-dashboard subPath mounts now
#     use a new "grafana-dashboards" configMap volume instead of "grafana-etc".
#     The volume only carries JSON files, so it uses defaultMode 0444 (no
#     execute bit), matching the "grafana-etc" volume next to it.
#   * grafana/values.yaml: adds manifests.configmap_dashboards: true.
#   * grafana/values_overrides/calico.yaml: the "calico" dashboard value changes
#     from a nested YAML mapping to a JSON document in a "|-" block scalar.
diff --git a/grafana/templates/configmap-dashboards.yaml b/grafana/templates/configmap-dashboards.yaml new file mode 100644 index 000000000..4daed2e85 --- /dev/null +++ b/grafana/templates/configmap-dashboards.yaml @@ -0,0 +1,27 @@ +{{/* +Copyright 2020 The Openstack-Helm Authors. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +*/}} + +{{- if .Values.manifests.configmap_dashboards }} +--- +apiVersion: v1 +kind: ConfigMap +metadata: + name: grafana-dashboards +data: +{{ range $key, $value := .Values.conf.dashboards }} + {{$key}}.json: {{ $value | toJson }} +{{ end }} +{{- end }} diff --git a/grafana/templates/configmap-etc.yaml b/grafana/templates/configmap-etc.yaml index 472c6cb6c..98c186b9f 100644 --- a/grafana/templates/configmap-etc.yaml +++ b/grafana/templates/configmap-etc.yaml @@ -41,7 +41,4 @@ data: {{ if not (empty .Values.conf.ldap) }} {{- include "helm-toolkit.snippets.values_template_renderer" (dict "envAll" $envAll "template" .Values.conf.ldap.template "key" "ldap.toml" "format" "Secret") | indent 2 }} {{ end }} -{{ range $key, $value := .Values.conf.dashboards }} - {{$key}}.json: {{ toJson $value | b64enc }} -{{ end }} {{- end }} diff --git a/grafana/templates/deployment.yaml b/grafana/templates/deployment.yaml index e5e604b7d..b26451ffa 100644 --- a/grafana/templates/deployment.yaml +++ b/grafana/templates/deployment.yaml @@ -116,7 +116,7 @@ spec: - name: data mountPath: /var/lib/grafana/data {{- range $key, $value := .Values.conf.dashboards }} - - name: grafana-etc + - 
name: grafana-dashboards mountPath: /etc/grafana/dashboards/{{$key}}.json subPath: {{$key}}.json {{- end }} @@ -140,6 +140,10 @@ spec: secret: secretName: grafana-etc defaultMode: 0444 + - name: grafana-dashboards + configMap: + name: grafana-dashboards + defaultMode: 0444 - name: data emptyDir: {} {{ if $mounts_grafana.volumes }}{{ toYaml $mounts_grafana.volumes | indent 8 }}{{ end }} diff --git a/grafana/values.yaml b/grafana/values.yaml index 6ae93a934..022f0ffdd 100644 --- a/grafana/values.yaml +++ b/grafana/values.yaml @@ -386,6 +386,7 @@ secrets: manifests: configmap_bin: true configmap_etc: true + configmap_dashboards: true deployment: true ingress: true helm_tests: true diff --git a/grafana/values_overrides/calico.yaml b/grafana/values_overrides/calico.yaml index 109b7826b..2543d58b2 100644 --- a/grafana/values_overrides/calico.yaml +++ b/grafana/values_overrides/calico.yaml @@ -2,1049 +2,1358 @@ # the Calico CNI conf: dashboards: - calico: - __inputs: - - name: prometheus - label: Prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 5.0.0 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - annotations: - list: - - builtIn: 1 - datasource: "-- Grafana --" - enable: true - hide: true - iconColor: rgba(0, 211, 255, 1) - name: Annotations & Alerts - type: dashboard - description: Calico cluster monitoring dashboard - editable: false - gnetId: 3244 - graphTooltip: 0 - id: - links: [] - panels: - - collapsed: false - gridPos: - h: 1 - w: 24 - x: 0 - 'y': 0 - id: 15 - panels: [] - repeat: - title: Felix - type: row - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 1 - id: 1 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - 
total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_active_local_endpoints - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Active Local Endpoints - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 1 - id: 3 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_active_local_policies - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Active Local Policies - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 8 - id: 2 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true 
- total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_active_local_selectors - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Active Local Selectors - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 8 - id: 4 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_active_local_tags - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Active Local Tags - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 15 - id: 5 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - 
total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_cluster_num_host_endpoints - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Cluster Host Endpoints - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 15 - id: 6 - legend: - alignAsTable: true - avg: false - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_cluster_num_workload_endpoints - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Cluster Workload Endpoints - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 22 - id: 7 - legend: - alignAsTable: true - avg: true - current: true - max: true - 
min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_cluster_num_hosts - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Clusters Hosts - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 22 - id: 8 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_ipsets_calico - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Active IP Sets - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 29 - id: 9 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - 
total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_iptables_chains - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Active IP Tables Chains - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 29 - id: 10 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_ipset_errors - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: IP Set Command Failures - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 36 - id: 11 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: 
false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_iptables_save_errors - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: IP Tables Save Errors - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 36 - id: 12 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_iptables_restore_errors - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: IP Tables Restore Errors - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 43 - id: 13 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - 
total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_resyncs_started - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Felix Resyncing Datastore - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 43 - id: 14 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_int_dataplane_failures - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Dataplane failed updates - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - refresh: 5m - schemaVersion: 16 - style: dark - tags: - - calico - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - 
regex: '' - type: datasource - time: - from: now-1h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: utc - title: Kubernetes Calico - version: 2 + calico: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Calico cluster monitoring dashboard", + "overwrite": true, + "editable": false, + "gnetId": 3244, + "graphTooltip": 0, + "id": 38, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "true": 0, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 15, + "panels": [], + "repeat": null, + "title": "Felix", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 1, + "w": 12, + "x": 0, + "y": 1 + }, + "id": 1, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": 
false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_active_local_endpoints", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active Local Endpoints", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 1, + "w": 12, + "x": 12, + "y": 1 + }, + "id": 3, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_active_local_policies", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active Local Policies", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": 
"short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 8, + "w": 12, + "x": 0, + "y": 8 + }, + "id": 2, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_active_local_selectors", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active Local Selectors", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 8, + "w": 12, + "x": 12, + "y": 8 + }, + "id": 4, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": 
true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_active_local_tags", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active Local Tags", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 15, + "w": 12, + "x": 0, + "y": 15 + }, + "id": 5, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_cluster_num_host_endpoints", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + 
"timeRegions": [], + "timeShift": null, + "title": "Cluster Host Endpoints", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 15, + "w": 12, + "x": 12, + "y": 15 + }, + "id": 6, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_cluster_num_workload_endpoints", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cluster Workload Endpoints", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + 
"alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 22, + "w": 12, + "x": 0, + "y": 22 + }, + "id": 7, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_cluster_num_hosts", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Clusters Hosts", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 22, + "w": 12, + "x": 12, + "y": 22 + }, + "id": 8, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": 
"flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_ipsets_calico", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active IP Sets", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 29, + "w": 12, + "x": 0, + "y": 29 + }, + "id": 9, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_iptables_chains", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active IP Tables Chains", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + 
"values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 29, + "w": 12, + "x": 12, + "y": 29 + }, + "id": 10, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_ipset_errors", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "IP Set Command Failures", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 36, + "w": 12, + "x": 0, + "y": 36 + }, + "id": 11, + "legend": { + "alignAsTable": true, + 
"avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_iptables_save_errors", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "IP Tables Save Errors", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 36, + "w": 12, + "x": 12, + "y": 36 + }, + "id": 12, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_iptables_restore_errors", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": 
"IP Tables Restore Errors", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 43, + "w": 12, + "x": 0, + "y": 43 + }, + "id": 13, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_resyncs_started", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Felix Resyncing Datastore", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 43, + "w": 
12, + "x": 12, + "y": 43 + }, + "id": 14, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_int_dataplane_failures", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Dataplane failed updates", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "calico" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "Kubernetes Calico", + "version": 1 + } \ No 
newline at end of file diff --git a/grafana/values_overrides/ceph.yaml b/grafana/values_overrides/ceph.yaml index 358e33067..562929921 100644 --- a/grafana/values_overrides/ceph.yaml +++ b/grafana/values_overrides/ceph.yaml @@ -3,2485 +3,3672 @@ # status of ceph pools for those clusters conf: dashboards: - ceph_cluster: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: Prometheus.IO - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: panel - id: singlestat - name: Singlestat - version: '' - - type: panel - id: graph - name: Graph - version: '' - - type: grafana - id: grafana - name: Grafana - version: 3.1.1 - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - id: - title: Ceph - Cluster - tags: - - ceph - - cluster - style: dark - timezone: browser - editable: true - hideControls: false - sharedCrosshair: false - rows: - - collapse: false - editable: true - height: 150px - panels: - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 21 - interval: 1m - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: ceph_health_status{application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - refId: A - step: 60 - thresholds: '1,1' - title: Status - transparent: false - type: 
singlestat - valueFontSize: 100% - valueMaps: - - op: "=" - text: N/A - value: 'null' - - op: "=" - text: HEALTHY - value: '0' - - op: "=" - text: WARNING - value: '1' - - op: "=" - text: CRITICAL - value: '2' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 22 - interval: 1m - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - targets: - - expr: count(ceph_pool_max_avail{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '' - title: Pools - transparent: false - type: singlestat - valueFontSize: 100% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: bytes - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 33 - interval: 1m - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - 
prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - targets: - - expr: ceph_cluster_total_bytes{application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: 0.025,0.1 - title: Cluster Capacity - transparent: false - type: singlestat - valueFontSize: 100% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: bytes - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 34 - interval: 1m - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - targets: - - expr: ceph_cluster_total_used_bytes{application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: 0.025,0.1 - title: Used Capacity - transparent: false - type: singlestat - valueFontSize: 100% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percentunit - gauge: - maxValue: 100 - 
minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 23 - interval: 1m - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: ceph_cluster_total_used_bytes/ceph_cluster_total_bytes{application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '70,80' - title: Current Utilization - transparent: false - type: singlestat - valueFontSize: 100% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - title: New row - - collapse: false - editable: true - height: 100px - panels: - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 26 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum(ceph_osd_in{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '' 
- title: OSDs IN - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 40, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 27 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum(ceph_osd_metadata{application="ceph",release_group="$ceph_cluster"}) - sum(ceph_osd_in{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '1,1' - title: OSDs OUT - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 28 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 
'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum(ceph_osd_up{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '' - title: OSDs UP - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 40, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 29 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum(ceph_osd_metadata{application="ceph",release_group="$ceph_cluster"}) - sum(ceph_osd_up{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '1,1' - title: OSDs DOWN - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 30 - 
interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - targets: - - expr: avg(ceph_osd_numpg{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '250,300' - title: Average PGs per OSD - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - title: New row - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: - Available: "#EAB839" - Total Capacity: "#447EBC" - Used: "#BF1B00" - total_avail: "#6ED0E0" - total_space: "#7EB26D" - total_used: "#890F02" - bars: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 4 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '300' - id: 1 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 0 - links: [] - minSpan: - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: Total Capacity - fill: 0 - linewidth: 3 - stack: false - span: 4 - stack: true - steppedLine: false - targets: - - expr: ceph_cluster_total_bytes{application="ceph",release_group="$ceph_cluster"} - ceph_cluster_total_used_bytes{application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Available - refId: A - step: 60 - - expr: 
ceph_cluster_total_used_bytes - interval: "$interval" - intervalFactor: 1 - legendFormat: Used - refId: B - step: 60 - - expr: ceph_cluster_total_bytes - interval: "$interval" - intervalFactor: 1 - legendFormat: Total Capacity - refId: C - step: 60 - timeFrom: - timeShift: - title: Capacity - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Total Capacity: "#7EB26D" - Used: "#BF1B00" - total_avail: "#6ED0E0" - total_space: "#7EB26D" - total_used: "#890F02" - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - thresholdLine: false - height: '300' - id: 3 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - minSpan: - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: true - steppedLine: false - targets: - - expr: sum(ceph_osd_op_w{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Write - refId: A - step: 60 - - expr: sum(ceph_osd_op_r{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Read - refId: B - step: 60 - timeFrom: - timeShift: - title: IOPS - tooltip: - msResolution: true - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: none - label: '' - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - 
aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '300' - id: 7 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: true - steppedLine: false - targets: - - expr: sum(ceph_osd_op_in_bytes{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Write - refId: A - step: 60 - - expr: sum(ceph_osd_op_out_bytes{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Read - refId: B - step: 60 - timeFrom: - timeShift: - title: Throughput - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: Bps - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - repeat: - showTitle: true - title: CLUSTER - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 18 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/^Total.*$/" - stack: false 
- span: 12 - stack: true - steppedLine: false - targets: - - expr: ceph_cluster_total_objects{application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Total - refId: A - step: 60 - timeFrom: - timeShift: - title: Objects in the Cluster - tooltip: - msResolution: false - shared: true - sort: 1 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 19 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/^Total.*$/" - stack: false - span: 6 - stack: true - steppedLine: false - targets: - - expr: sum(ceph_osd_numpg{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Total - refId: A - step: 60 - - expr: sum(ceph_pg_active{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Active - refId: B - step: 60 - - expr: sum(ceph_pg_inconsistent{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Inconsistent - refId: C - step: 60 - - expr: sum(ceph_pg_creating{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Creating - refId: D - step: 60 - - expr: sum(ceph_pg_recovering{application="ceph",release_group="$ceph_cluster"}) - interval: 
"$interval" - intervalFactor: 1 - legendFormat: Recovering - refId: E - step: 60 - - expr: sum(ceph_pg_down{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Down - refId: F - step: 60 - timeFrom: - timeShift: - title: PGs - tooltip: - msResolution: false - shared: true - sort: 1 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 20 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/^Total.*$/" - stack: false - span: 6 - stack: true - steppedLine: false - targets: - - expr: sum(ceph_pg_degraded{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Degraded - refId: A - step: 60 - - expr: sum(ceph_pg_stale{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Stale - refId: B - step: 60 - - expr: sum(ceph_pg_undersized{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Undersized - refId: C - step: 60 - timeFrom: - timeShift: - title: Stuck PGs - tooltip: - msResolution: false - shared: true - sort: 1 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 
1 - max: - min: - show: true - title: New row - time: - from: now-1h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - current: {} - hide: 0 - label: Cluster - name: ceph_cluster - options: [] - type: query - query: label_values(ceph_health_status, release_group) - refresh: 1 - sort: 2 - datasource: "${DS_PROMETHEUS}" - - auto: true - auto_count: 10 - auto_min: 1m - current: - tags: [] - text: 1m - value: 1m - datasource: - hide: 0 - includeAll: false - label: Interval - multi: false - name: interval - options: - - selected: false - text: auto - value: "$__auto_interval" - - selected: true - text: 1m - value: 1m - - selected: false - text: 10m - value: 10m - - selected: false - text: 30m - value: 30m - - selected: false - text: 1h - value: 1h - - selected: false - text: 6h - value: 6h - - selected: false - text: 12h - value: 12h - - selected: false - text: 1d - value: 1d - - selected: false - text: 7d - value: 7d - - selected: false - text: 14d - value: 14d - - selected: false - text: 30d - value: 30d - query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d - refresh: 0 - type: interval - annotations: - list: [] - refresh: 5m - schemaVersion: 12 - version: 26 - links: [] - gnetId: 917 - description: "Ceph Cluster overview.\r\n" - ceph_osd: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: Prometheus.IO - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: panel - id: singlestat - name: Singlestat - version: '' - - type: panel - id: graph - name: Graph - version: '' - - type: grafana - id: grafana - name: Grafana - version: 3.1.1 - - type: datasource - id: 
prometheus - name: Prometheus - version: 1.0.0 - id: - title: Ceph - OSD - tags: - - ceph - - osd - style: dark - timezone: browser - editable: true - hideControls: false - sharedCrosshair: false - rows: - - collapse: false - editable: true - height: 100px - panels: - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 40, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 6 - interval: - isNew: true - links: [] - mappingType: 2 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - - from: '0' - text: DOWN - to: '0.99' - - from: '0.99' - text: UP - to: '1' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: ceph_osd_up{ceph_daemon="$osd",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - refId: A - step: 60 - thresholds: '0,1' - timeFrom: - title: Status - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: DOWN - value: '0' - - op: "=" - text: UP - value: '1' - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 40, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 8 - interval: - isNew: true - links: [] - mappingType: 2 - mappingTypes: - - name: value to 
text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - - from: '0' - text: OUT - to: '0.99' - - from: '0.99' - text: IN - to: '1' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: ceph_osd_in{ceph_daemon="$osd",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - refId: A - step: 60 - thresholds: '0,1' - timeFrom: - title: Available - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: DOWN - value: '0' - - op: "=" - text: UP - value: '1' - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 10 - interval: - isNew: true - links: [] - mappingType: 2 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: count(ceph_osd_metadata{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - refId: A - step: 60 - thresholds: '0,1' - timeFrom: - title: Total OSDs - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: DOWN - value: '0' - - op: "=" - 
text: UP - value: '1' - - op: "=" - text: N/A - value: 'null' - valueName: current - title: New row - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: 250 - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: 300 - threshold2Color: rgba(234, 112, 112, 0.22) - thresholdLine: true - id: 5 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/^Average.*/" - fill: 0 - stack: false - span: 10 - stack: true - steppedLine: false - targets: - - expr: ceph_osd_numpg{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Number of PGs - {{ $osd }} - refId: A - step: 60 - - expr: avg(ceph_osd_numpg{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Average Number of PGs in the Cluster - refId: B - step: 60 - timeFrom: - timeShift: - title: PGs - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 7 - interval: - isNew: true - links: [] - mappingType: 1 - 
mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: true - targets: - - expr: (ceph_osd_stat_bytes_used{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"}/ceph_osd_stat_bytes{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"})*100 - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '60,80' - timeFrom: - title: Utilization - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - showTitle: true - title: 'OSD: $osd' - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 2 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: true - steppedLine: false - targets: - - expr: ceph_osd_stat_bytes_used{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Used - {{ osd.$osd }} - metric: ceph_osd_used_bytes - refId: A - step: 60 - - expr: ceph_osd_stat_bytes{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"} - 
ceph_osd_stat_bytes_used{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"} - hide: false - interval: "$interval" - intervalFactor: 1 - legendFormat: Available - {{ $osd }} - metric: ceph_osd_avail_bytes - refId: B - step: 60 - timeFrom: - timeShift: - title: OSD Storage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 5 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 9 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: false - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 2 - points: true - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: (ceph_osd_stat_bytes_used{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"}/ceph_osd_stat_bytes{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Available - {{ $osd }} - metric: ceph_osd_avail_bytes - refId: A - step: 60 - timeFrom: - timeShift: - title: Utilization Variance - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: none - label: - logBase: 1 - max: - min: - show: true - - format: none - label: - logBase: 1 - max: - min: - show: true - time: - from: now-1h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: 
- - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - current: {} - hide: 0 - label: Cluster - name: ceph_cluster - options: [] - type: query - query: label_values(ceph_health_status, release_group) - refresh: 1 - sort: 2 - datasource: "${DS_PROMETHEUS}" - - auto: true - auto_count: 10 - auto_min: 1m - current: - selected: true - text: 1m - value: 1m - datasource: - hide: 0 - includeAll: false - label: Interval - multi: false - name: interval - options: - - selected: false - text: auto - value: "$__auto_interval" - - selected: true - text: 1m - value: 1m - - selected: false - text: 10m - value: 10m - - selected: false - text: 30m - value: 30m - - selected: false - text: 1h - value: 1h - - selected: false - text: 6h - value: 6h - - selected: false - text: 12h - value: 12h - - selected: false - text: 1d - value: 1d - - selected: false - text: 7d - value: 7d - - selected: false - text: 14d - value: 14d - - selected: false - text: 30d - value: 30d - query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d - refresh: 0 - type: interval - - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: OSD - multi: false - name: osd - options: [] - query: label_values(ceph_osd_metadata{release_group="$ceph_cluster"}, ceph_daemon) - refresh: 1 - regex: '' - type: query - annotations: - list: [] - refresh: 15m - schemaVersion: 12 - version: 18 - links: [] - gnetId: 923 - description: CEPH OSD Status. 
- ceph_pool: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: Prometheus.IO - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: panel - id: graph - name: Graph - version: '' - - type: panel - id: singlestat - name: Singlestat - version: '' - - type: grafana - id: grafana - name: Grafana - version: 3.1.1 - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - id: - title: Ceph - Pools - tags: - - ceph - - pools - style: dark - timezone: browser - editable: true - hideControls: false - sharedCrosshair: false - rows: - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 4 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '' - id: 2 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - rightSide: true - show: true - total: false - values: true - lines: true - linewidth: 0 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/^Total.*$/" - fill: 0 - linewidth: 4 - stack: false - - alias: "/^Raw.*$/" - color: "#BF1B00" - fill: 0 - linewidth: 4 - span: 10 - stack: true - steppedLine: false - targets: - - expr: ceph_pool_max_avail{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Total - {{ $pool }} - refId: A - step: 60 - - expr: ceph_pool_bytes_used{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Used - {{ $pool }} - refId: B - step: 60 - - expr: ceph_pool_max_avail{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - 
ceph_pool_bytes_used{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Available - {{ $pool }} - refId: C - step: 60 - - expr: ceph_pool_raw_bytes_used{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Raw - {{ $pool }} - refId: D - step: 60 - timeFrom: - timeShift: - title: "[[pool_name]] Pool Storage" - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: percentunit - gauge: - maxValue: 1 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 10 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: (ceph_pool_bytes_used{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} / ceph_pool_max_avail{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - refId: A - step: 60 - thresholds: '' - title: "[[pool_name]] Pool Usage" - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - showTitle: true - title: 
'Pool: $pool' - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '' - id: 7 - isNew: true - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: ceph_pool_objects{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Objects - {{ $pool_name }} - refId: A - step: 60 - - expr: ceph_pool_dirty{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Dirty Objects - {{ $pool_name }} - refId: B - step: 60 - timeFrom: - timeShift: - title: Objects in Pool [[pool_name]] - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - thresholdLine: false - id: 4 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - 
seriesOverrides: [] - span: 6 - stack: true - steppedLine: false - targets: - - expr: irate(ceph_pool_rd{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}[3m]) - interval: "$interval" - intervalFactor: 1 - legendFormat: Read - {{ $pool_name }} - refId: B - step: 60 - - expr: irate(ceph_pool_wr{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}[3m]) - interval: "$interval" - intervalFactor: 1 - legendFormat: Write - {{ $pool_name }} - refId: A - step: 60 - timeFrom: - timeShift: - title: "[[pool_name]] Pool IOPS" - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: none - label: IOPS - logBase: 1 - max: - min: 0 - show: true - - format: short - label: IOPS - logBase: 1 - max: - min: 0 - show: false - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 5 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: true - steppedLine: false - targets: - - expr: irate(ceph_pool_rd_bytes{pool_id="$pool",application="ceph",release_group="$ceph_cluster"}[3m]) - interval: "$interval" - intervalFactor: 1 - legendFormat: Read Bytes - {{ $pool_name }} - refId: A - step: 60 - - expr: irate(ceph_pool_wr_bytes{pool_id="$pool",application="ceph",release_group="$ceph_cluster"}[3m]) - interval: "$interval" - intervalFactor: 1 - legendFormat: Written Bytes - {{ $pool_name }} - refId: B - step: 60 - timeFrom: - timeShift: - title: "[[pool_name]] Pool Throughput" - tooltip: - msResolution: 
false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: Bps - label: - logBase: 1 - max: - min: 0 - show: true - - format: Bps - label: - logBase: 1 - max: - min: 0 - show: true - title: New row - time: - from: now-3h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - current: {} - hide: 0 - label: Cluster - name: ceph_cluster - options: [] - type: query - query: label_values(ceph_health_status, release_group) - refresh: 1 - sort: 2 - datasource: "${DS_PROMETHEUS}" - - auto: true - auto_count: 10 - auto_min: 1m - current: - selected: true - text: 1m - value: 1m - datasource: - hide: 0 - includeAll: false - label: Interval - multi: false - name: interval - options: - - selected: false - text: auto - value: "$__auto_interval" - - selected: true - text: 1m - value: 1m - - selected: false - text: 10m - value: 10m - - selected: false - text: 30m - value: 30m - - selected: false - text: 1h - value: 1h - - selected: false - text: 6h - value: 6h - - selected: false - text: 12h - value: 12h - - selected: false - text: 1d - value: 1d - - selected: false - text: 7d - value: 7d - - selected: false - text: 14d - value: 14d - - selected: false - text: 30d - value: 30d - query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d - refresh: 0 - type: interval - - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: Pool - multi: false - name: pool - options: [] - query: label_values(ceph_pool_objects{release_group="$ceph_cluster"}, pool_id) - refresh: 1 - regex: '' - type: query - - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - 
includeAll: false - label: Pool - multi: false - name: pool_name - options: [] - query: label_values(ceph_pool_metadata{release_group="$ceph_cluster",pool_id="[[pool]]" }, name) - refresh: 1 - regex: '' - type: query - annotations: - list: [] - refresh: 5m - schemaVersion: 12 - version: 22 - links: [] - gnetId: 926 - description: Ceph Pools dashboard. + ceph_cluster: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "Prometheus.IO", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "3.1.1" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Ceph Cluster overview.\r\n", + "overwrite": true, + "editable": false, + "gnetId": 917, + "graphTooltip": 0, + "id": 14, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 35, + "panels": [], + "title": "New row", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 21, + "interval": 
"1m", + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "ceph_health_status{application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "refId": "A", + "step": 60 + } + ], + "thresholds": "1,1", + "title": "Status", + "type": "singlestat", + "valueFontSize": "100%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + }, + { + "op": "=", + "text": "HEALTHY", + "value": "0" + }, + { + "op": "=", + "text": "WARNING", + "value": "1" + }, + { + "op": "=", + "text": "CRITICAL", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 4, + "y": 1 + }, + "id": 22, + "interval": "1m", + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + 
"prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "count(ceph_pool_max_avail{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "", + "title": "Pools", + "type": "singlestat", + "valueFontSize": "100%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "bytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 8, + "y": 1 + }, + "id": 33, + "interval": "1m", + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "ceph_cluster_total_bytes{application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + 
"thresholds": "0.025,0.1", + "title": "Cluster Capacity", + "type": "singlestat", + "valueFontSize": "100%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "bytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 12, + "y": 1 + }, + "id": 34, + "interval": "1m", + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "ceph_cluster_total_used_bytes{application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "0.025,0.1", + "title": "Used Capacity", + "type": "singlestat", + "valueFontSize": "100%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": 
false, + "format": "percentunit", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 16, + "y": 1 + }, + "id": 23, + "interval": "1m", + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "ceph_cluster_total_used_bytes/ceph_cluster_total_bytes{application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "70,80", + "title": "Current Utilization", + "type": "singlestat", + "valueFontSize": "100%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 5 + }, + "id": 36, + "panels": [], + "title": "New row", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 0, + "y": 6 + }, + "id": 26, + "interval": null, + "isNew": true, + "links": [], + 
"mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(ceph_osd_in{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "", + "title": "OSDs IN", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 40, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 2, + "y": 6 + }, + "id": 27, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 
120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(ceph_osd_metadata{application=\"ceph\",release_group=\"$ceph_cluster\"}) - sum(ceph_osd_in{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "1,1", + "title": "OSDs OUT", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 4, + "y": 6 + }, + "id": 28, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(ceph_osd_up{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "", + "title": "OSDs UP", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + 
"value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 40, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 6, + "y": 6 + }, + "id": 29, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(ceph_osd_metadata{application=\"ceph\",release_group=\"$ceph_cluster\"}) - sum(ceph_osd_up{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "1,1", + "title": "OSDs DOWN", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": 
false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 8, + "y": 6 + }, + "id": 30, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "avg(ceph_osd_numpg{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "250,300", + "title": "Average PGs per OSD", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 9 + }, + "id": 37, + "panels": [], + "repeat": null, + "title": "CLUSTER", + "type": "row" + }, + { + "aliasColors": { + "Available": "#EAB839", + "Total Capacity": "#447EBC", + "Used": "#BF1B00", + "total_avail": "#6ED0E0", + "total_space": "#7EB26D", + "total_used": "#890F02" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 4, + "grid": {}, + "gridPos": { + "h": 8, + "w": 8, + "x": 0, + "y": 10 + }, + "height": "300", + "id": 1, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 0, 
+ "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "Total Capacity", + "fill": 0, + "linewidth": 3, + "stack": false + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "ceph_cluster_total_bytes{application=\"ceph\",release_group=\"$ceph_cluster\"} - ceph_cluster_total_used_bytes{application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Available", + "refId": "A", + "step": 60 + }, + { + "expr": "ceph_cluster_total_used_bytes", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Used", + "refId": "B", + "step": 60 + }, + { + "expr": "ceph_cluster_total_bytes", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Total Capacity", + "refId": "C", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Capacity", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Total Capacity": "#7EB26D", + "Used": "#BF1B00", + "total_avail": "#6ED0E0", + "total_space": "#7EB26D", + "total_used": "#890F02" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 8, + "w": 8, + "x": 8, + "y": 10 + }, + "height": "300", + 
"id": 3, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum(ceph_osd_op_w{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Write", + "refId": "A", + "step": 60 + }, + { + "expr": "sum(ceph_osd_op_r{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Read", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "IOPS", + "tooltip": { + "msResolution": true, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 8, + "w": 8, + "x": 16, + "y": 10 + }, + "height": "300", + "id": 7, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": 
true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum(ceph_osd_op_in_bytes{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Write", + "refId": "A", + "step": 60 + }, + { + "expr": "sum(ceph_osd_op_out_bytes{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Read", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Throughput", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 18 + }, + "id": 38, + "panels": [], + "title": "New row", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 19 + }, + "id": 18, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": 
"connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/^Total.*$/", + "stack": false + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "ceph_cluster_total_objects{application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Total", + "refId": "A", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Objects in the Cluster", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 1, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 26 + }, + "id": 19, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/^Total.*$/", + "stack": false + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": 
"sum(ceph_osd_numpg{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Total", + "refId": "A", + "step": 60 + }, + { + "expr": "sum(ceph_pg_active{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Active", + "refId": "B", + "step": 60 + }, + { + "expr": "sum(ceph_pg_inconsistent{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Inconsistent", + "refId": "C", + "step": 60 + }, + { + "expr": "sum(ceph_pg_creating{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Creating", + "refId": "D", + "step": 60 + }, + { + "expr": "sum(ceph_pg_recovering{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Recovering", + "refId": "E", + "step": 60 + }, + { + "expr": "sum(ceph_pg_down{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Down", + "refId": "F", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "PGs", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 1, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, 
+ "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 26 + }, + "id": 20, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/^Total.*$/", + "stack": false + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum(ceph_pg_degraded{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Degraded", + "refId": "A", + "step": 60 + }, + { + "expr": "sum(ceph_pg_stale{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Stale", + "refId": "B", + "step": 60 + }, + { + "expr": "sum(ceph_pg_undersized{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Undersized", + "refId": "C", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Stuck PGs", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 1, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "ceph", + "cluster" + ], + 
"templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "Cluster", + "multi": false, + "name": "ceph_cluster", + "options": [], + "query": "label_values(ceph_health_status, release_group)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 2, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "auto": true, + "auto_count": 10, + "auto_min": "1m", + "current": { + "text": "1m", + "value": "1m" + }, + "datasource": null, + "hide": 0, + "includeAll": false, + "label": "Interval", + "multi": false, + "name": "interval", + "options": [ + { + "selected": false, + "text": "auto", + "value": "$__auto_interval_interval" + }, + { + "selected": true, + "text": "1m", + "value": "1m" + }, + { + "selected": false, + "text": "10m", + "value": "10m" + }, + { + "selected": false, + "text": "30m", + "value": "30m" + }, + { + "selected": false, + "text": "1h", + "value": "1h" + }, + { + "selected": false, + "text": "6h", + "value": "6h" + }, + { + "selected": false, + "text": "12h", + "value": "12h" + }, + { + "selected": false, + "text": "1d", + "value": "1d" + }, + { + "selected": false, + "text": "7d", + "value": "7d" + }, + { + "selected": false, + "text": "14d", + "value": "14d" + }, + { + "selected": false, + "text": "30d", + "value": "30d" + } + ], + "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d", + "refresh": 2, + "skipUrlSync": false, + "type": "interval" + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", 
+ "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "Ceph - Cluster", + "version": 1 + } + ceph_osd: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "Prometheus.IO", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "3.1.1" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "CEPH OSD Status.", + "overwrite": true, + "editable": true, + "gnetId": 923, + "graphTooltip": 0, + "id": 17, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 11, + "panels": [], + "title": "New row", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 40, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 0, + "y": 1 + }, + "id": 6, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 2, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + 
"name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + }, + { + "from": "0", + "text": "DOWN", + "to": "0.99" + }, + { + "from": "0.99", + "text": "UP", + "to": "1" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "ceph_osd_up{ceph_daemon=\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "refId": "A", + "step": 60 + } + ], + "thresholds": "0,1", + "timeFrom": null, + "title": "Status", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "DOWN", + "value": "0" + }, + { + "op": "=", + "text": "UP", + "value": "1" + }, + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 40, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 2, + "y": 1 + }, + "id": 8, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 2, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + 
"text": "N/A", + "to": "null" + }, + { + "from": "0", + "text": "OUT", + "to": "0.99" + }, + { + "from": "0.99", + "text": "IN", + "to": "1" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "ceph_osd_in{ceph_daemon=\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "refId": "A", + "step": 60 + } + ], + "thresholds": "0,1", + "timeFrom": null, + "title": "Available", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "DOWN", + "value": "0" + }, + { + "op": "=", + "text": "UP", + "value": "1" + }, + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 4, + "y": 1 + }, + "id": 10, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 2, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": 
"count(ceph_osd_metadata{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "refId": "A", + "step": 60 + } + ], + "thresholds": "0,1", + "timeFrom": null, + "title": "Total OSDs", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "DOWN", + "value": "0" + }, + { + "op": "=", + "text": "UP", + "value": "1" + }, + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 4 + }, + "id": 12, + "panels": [], + "title": "OSD: $osd", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 20, + "x": 0, + "y": 5 + }, + "id": 5, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/^Average.*/", + "fill": 0, + "stack": false + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "ceph_osd_numpg{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Number of PGs - {{ $osd }}", + "refId": "A", + "step": 60 + }, + { + "expr": "avg(ceph_osd_numpg{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Average Number of PGs in the Cluster", + "refId": "B", + "step": 60 + } + ], + "thresholds": [ + { + 
"colorMode": "custom", + "line": true, + "lineColor": "rgba(216, 200, 27, 0.27)", + "op": "gt", + "value": 250 + }, + { + "colorMode": "custom", + "line": true, + "lineColor": "rgba(234, 112, 112, 0.22)", + "op": "gt", + "value": 300 + } + ], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "PGs", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 20, + "y": 5 + }, + "id": 7, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": 
"(ceph_osd_stat_bytes_used{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\"}/ceph_osd_stat_bytes{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\"})*100", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "60,80", + "timeFrom": null, + "title": "Utilization", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 12 + }, + "id": 13, + "panels": [], + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 13 + }, + "id": 2, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "ceph_osd_stat_bytes_used{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Used - {{ osd.$osd }}", + "metric": "ceph_osd_used_bytes", + "refId": "A", + "step": 60 + }, + { + "expr": "ceph_osd_stat_bytes{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\"} - ceph_osd_stat_bytes_used{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\"}", + "hide": false, + "interval": "$interval", + "intervalFactor": 
1, + "legendFormat": "Available - {{ $osd }}", + "metric": "ceph_osd_avail_bytes", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "OSD Storage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 5, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 13 + }, + "id": 9, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": false, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": true, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "(ceph_osd_stat_bytes_used{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\"}/ceph_osd_stat_bytes{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\"})", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Available - {{ $osd }}", + "metric": "ceph_osd_avail_bytes", + "refId": "A", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Utilization 
Variance", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "15m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "ceph", + "osd" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": { + "text": "clcp-ucp-ceph-client", + "value": "clcp-ucp-ceph-client" + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "Cluster", + "multi": false, + "name": "ceph_cluster", + "options": [], + "query": "label_values(ceph_health_status, release_group)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 2, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "auto": true, + "auto_count": 10, + "auto_min": "1m", + "current": { + "text": "1m", + "value": "1m" + }, + "datasource": null, + "hide": 0, + "includeAll": false, + "label": "Interval", + "multi": false, + "name": "interval", + "options": [ + { + "selected": false, + "text": "auto", + "value": "$__auto_interval_interval" + }, + { + "selected": true, + "text": "1m", + "value": "1m" + }, + { + "selected": false, + "text": "10m", + "value": "10m" + }, + { + "selected": false, + "text": "30m", + 
"value": "30m" + }, + { + "selected": false, + "text": "1h", + "value": "1h" + }, + { + "selected": false, + "text": "6h", + "value": "6h" + }, + { + "selected": false, + "text": "12h", + "value": "12h" + }, + { + "selected": false, + "text": "1d", + "value": "1d" + }, + { + "selected": false, + "text": "7d", + "value": "7d" + }, + { + "selected": false, + "text": "14d", + "value": "14d" + }, + { + "selected": false, + "text": "30d", + "value": "30d" + } + ], + "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d", + "refresh": 2, + "skipUrlSync": false, + "type": "interval" + }, + { + "allValue": null, + "current": { + "text": "osd.0", + "value": "osd.0" + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "OSD", + "multi": false, + "name": "osd", + "options": [], + "query": "label_values(ceph_osd_metadata{release_group=\"$ceph_cluster\"}, ceph_daemon)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "Ceph - OSD", + "version": 1 + } + ceph_pool: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "Prometheus.IO", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "3.1.1" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + 
"name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Ceph Pools dashboard.", + "overwrite": true, + "editable": false, + "gnetId": 926, + "graphTooltip": 0, + "id": 2, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 11, + "panels": [], + "title": "Pool: $pool", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 4, + "grid": {}, + "gridPos": { + "h": 7, + "w": 20, + "x": 0, + "y": 1 + }, + "height": "", + "id": 2, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 0, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/^Total.*$/", + "fill": 0, + "linewidth": 4, + "stack": false + }, + { + "alias": "/^Raw.*$/", + "color": "#BF1B00", + "fill": 0, + "linewidth": 4 + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "ceph_pool_max_avail{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Total - {{ $pool }}", + "refId": "A", + "step": 60 + }, + { + "expr": "ceph_pool_bytes_used{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Used - {{ $pool }}", + 
"refId": "B", + "step": 60 + }, + { + "expr": "ceph_pool_max_avail{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"} - ceph_pool_bytes_used{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Available - {{ $pool }}", + "refId": "C", + "step": 60 + }, + { + "expr": "ceph_pool_raw_bytes_used{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Raw - {{ $pool }}", + "refId": "D", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "[[pool_name]] Pool Storage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "percentunit", + "gauge": { + "maxValue": 1, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 20, + "y": 1 + }, + "id": 10, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + 
"nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "(ceph_pool_bytes_used{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"} / ceph_pool_max_avail{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "refId": "A", + "step": 60 + } + ], + "thresholds": "", + "title": "[[pool_name]] Pool Usage", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 8 + }, + "id": 12, + "panels": [], + "title": "New row", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 9 + }, + "height": "", + "id": 7, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "ceph_pool_objects{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Objects - {{ $pool_name }}", + "refId": 
"A", + "step": 60 + }, + { + "expr": "ceph_pool_dirty{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"}", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Dirty Objects - {{ $pool_name }}", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Objects in Pool [[pool_name]]", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 9 + }, + "id": 4, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "irate(ceph_pool_rd{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"}[3m])", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Read - {{ $pool_name }}", + "refId": "B", + "step": 60 + }, + { + "expr": 
"irate(ceph_pool_wr{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"}[3m])", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Write - {{ $pool_name }}", + "refId": "A", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "[[pool_name]] Pool IOPS", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "IOPS", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": "IOPS", + "logBase": 1, + "max": null, + "min": 0, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 16 + }, + "id": 5, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "irate(ceph_pool_rd_bytes{pool_id=\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"}[3m])", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Read Bytes - {{ $pool_name }}", + "refId": "A", + "step": 60 + }, + { + "expr": 
"irate(ceph_pool_wr_bytes{pool_id=\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\"}[3m])", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Written Bytes - {{ $pool_name }}", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "[[pool_name]] Pool Throughput", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "ceph", + "pools" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": { + "text": "clcp-ucp-ceph-client", + "value": "clcp-ucp-ceph-client" + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "Cluster", + "multi": false, + "name": "ceph_cluster", + "options": [], + "query": "label_values(ceph_health_status, release_group)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 2, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "auto": true, + "auto_count": 10, + "auto_min": "1m", + "current": { + "text": "1m", + "value": "1m" + }, + "datasource": null, + "hide": 0, + 
"includeAll": false, + "label": "Interval", + "multi": false, + "name": "interval", + "options": [ + { + "selected": false, + "text": "auto", + "value": "$__auto_interval_interval" + }, + { + "selected": true, + "text": "1m", + "value": "1m" + }, + { + "selected": false, + "text": "10m", + "value": "10m" + }, + { + "selected": false, + "text": "30m", + "value": "30m" + }, + { + "selected": false, + "text": "1h", + "value": "1h" + }, + { + "selected": false, + "text": "6h", + "value": "6h" + }, + { + "selected": false, + "text": "12h", + "value": "12h" + }, + { + "selected": false, + "text": "1d", + "value": "1d" + }, + { + "selected": false, + "text": "7d", + "value": "7d" + }, + { + "selected": false, + "text": "14d", + "value": "14d" + }, + { + "selected": false, + "text": "30d", + "value": "30d" + } + ], + "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d", + "refresh": 2, + "skipUrlSync": false, + "type": "interval" + }, + { + "allValue": null, + "current": { + "text": "1", + "value": "1" + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "Pool", + "multi": false, + "name": "pool", + "options": [], + "query": "label_values(ceph_pool_objects{release_group=\"$ceph_cluster\"}, pool_id)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": { + "text": "rbd", + "value": "rbd" + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "Pool", + "multi": false, + "name": "pool_name", + "options": [], + "query": "label_values(ceph_pool_metadata{release_group=\"$ceph_cluster\",pool_id=\"[[pool]]\" }, name)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": 
"now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "Ceph - Pools", + "version": 1 + } \ No newline at end of file diff --git a/grafana/values_overrides/containers.yaml b/grafana/values_overrides/containers.yaml index c2b019f2c..12037cead 100644 --- a/grafana/values_overrides/containers.yaml +++ b/grafana/values_overrides/containers.yaml @@ -2,1699 +2,2102 @@ # container metrics, specific to each host conf: dashboards: - containers: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: panel - id: graph - name: Graph - version: '' - - type: panel - id: singlestat - name: Singlestat - version: '' - - type: grafana - id: grafana - name: Grafana - version: 3.1.1 - - type: datasource - id: prometheus - name: Prometheus - version: 1.3.0 - id: - title: Container Metrics (cAdvisor) - description: Monitors Kubernetes cluster using Prometheus. Shows overall cluster CPU - / Memory / Filesystem usage as well as individual pod, containers, systemd services - statistics. Uses cAdvisor metrics only. 
- tags: - - kubernetes - style: dark - timezone: browser - editable: true - hideControls: false - sharedCrosshair: false - rows: - - collapse: false - editable: true - height: 200px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - thresholdLine: false - height: 200px - id: 32 - isNew: true - legend: - alignAsTable: false - avg: true - current: true - max: false - min: false - rightSide: false - show: false - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: false - targets: - - expr: sum (rate (container_network_receive_bytes_total{kubernetes_io_hostname=~"^$Node$"}[5m])) - interval: 10s - intervalFactor: 1 - legendFormat: Received - metric: network - refId: A - step: 10 - - expr: '- sum (rate (container_network_transmit_bytes_total{kubernetes_io_hostname=~"^$Node$"}[5m]))' - interval: 10s - intervalFactor: 1 - legendFormat: Sent - metric: network - refId: B - step: 10 - timeFrom: - timeShift: - title: Network I/O pressure - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - show: true - yaxes: - - format: Bps - label: - logBase: 1 - max: - min: - show: true - - format: Bps - label: - logBase: 1 - max: - min: - show: false - title: Network I/O pressure - - collapse: false - editable: true - height: 250px - panels: - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percent - gauge: - 
maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - height: 180px - id: 4 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (container_memory_working_set_bytes{id="/",kubernetes_io_hostname=~"^$Node$"}) - / sum (machine_memory_bytes{kubernetes_io_hostname=~"^$Node$"}) * 100 - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: 65, 90 - title: Cluster memory usage - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - height: 180px - id: 6 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (rate (container_cpu_usage_seconds_total{id="/",kubernetes_io_hostname=~"^$Node$"}[5m])) - / sum (machine_cpu_cores{kubernetes_io_hostname=~"^$Node$"}) * 100 - 
interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: 65, 90 - title: Cluster CPU usage (5m avg) - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - height: 180px - id: 7 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (container_fs_usage_bytes{device=~"^/dev/[sv]da[0-9]$",id=~"/.+",kubernetes_io_hostname=~"^$Node$"}) - / sum (container_fs_limit_bytes{device=~"^/dev/[sv]da[0-9]$",id=~"/.+",kubernetes_io_hostname=~"^$Node$"}) - * 100 - interval: 10s - intervalFactor: 1 - legendFormat: '' - metric: '' - refId: A - step: 10 - thresholds: 65, 90 - title: Cluster filesystem usage - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: bytes - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: 1px - id: 9 - interval: - isNew: true - links: [] - mappingType: 1 - 
mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 20% - prefix: '' - prefixFontSize: 20% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (container_memory_working_set_bytes{id="/",kubernetes_io_hostname=~"^$Node$"}) - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: '' - title: Used - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: bytes - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: 1px - id: 10 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (machine_memory_bytes{kubernetes_io_hostname=~"^$Node$"}) - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: '' - title: Total - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: 
"${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: 1px - id: 11 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: " cores" - postfixFontSize: 30% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (rate (container_cpu_usage_seconds_total{id="/",kubernetes_io_hostname=~"^$Node$"}[5m])) - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: '' - title: Used - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: 1px - id: 12 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: " cores" - postfixFontSize: 30% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (machine_cpu_cores{kubernetes_io_hostname=~"^$Node$"}) - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: '' - title: Total - type: singlestat - 
valueFontSize: 50% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: bytes - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: 1px - id: 13 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (container_fs_usage_bytes{device=~"^/dev/[sv]da[0-9]$",id=~"/.+",kubernetes_io_hostname=~"^$Node$"}) - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: '' - title: Used - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: bytes - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: 1px - id: 14 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 
118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (container_fs_limit_bytes{device=~"^/dev/[sv]da[0-9]$",id=~"/.+",kubernetes_io_hostname=~"^$Node$"}) - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: '' - title: Total - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - showTitle: false - title: Total usage - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 3 - editable: true - error: false - fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '' - id: 17 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (rate (container_cpu_usage_seconds_total{image!="",name=~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (pod) - interval: 10s - intervalFactor: 1 - legendFormat: "{{ pod }}" - metric: container_cpu - refId: A - step: 10 - timeFrom: - timeShift: - title: Pods CPU usage (5m avg) - tooltip: - msResolution: true - shared: true - sort: 2 - value_type: cumulative - transparent: false - type: graph - xaxis: - show: true - yaxes: - - format: none - label: cores - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - showTitle: false - title: Pods CPU usage - - collapse: true - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 3 - editable: true - error: false - 
fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '' - id: 23 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (rate (container_cpu_usage_seconds_total{systemd_service_name!="",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (systemd_service_name) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "{{ systemd_service_name }}" - metric: container_cpu - refId: A - step: 10 - timeFrom: - timeShift: - title: System services CPU usage (5m avg) - tooltip: - msResolution: true - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: none - label: cores - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: System services CPU usage - - collapse: true - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 3 - editable: true - error: false - fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '' - id: 24 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: false - min: false - rightSide: true - show: true - sideWidth: - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - 
steppedLine: true - targets: - - expr: sum (rate (container_cpu_usage_seconds_total{image!="",name=~"^k8s_.*",container!="POD",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (container, pod) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: 'pod: {{ pod }} | {{ container }}' - metric: container_cpu - refId: A - step: 10 - - expr: sum (rate (container_cpu_usage_seconds_total{image!="",name!~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (kubernetes_io_hostname, name, image) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: 'docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})' - metric: container_cpu - refId: B - step: 10 - - expr: sum (rate (container_cpu_usage_seconds_total{rkt_container_name!="",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (kubernetes_io_hostname, rkt_container_name) - interval: 10s - intervalFactor: 1 - legendFormat: 'rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}' - metric: container_cpu - refId: C - step: 10 - timeFrom: - timeShift: - title: Containers CPU usage (5m avg) - tooltip: - msResolution: true - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: none - label: cores - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: Containers CPU usage - - collapse: true - editable: true - height: 500px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 3 - editable: true - error: false - fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 20 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: false - show: true - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: 
false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (rate (container_cpu_usage_seconds_total{id!="/",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (id) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "{{ id }}" - metric: container_cpu - refId: A - step: 10 - timeFrom: - timeShift: - title: All processes CPU usage (5m avg) - tooltip: - msResolution: true - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: none - label: cores - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - showTitle: false - title: All processes CPU usage - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 25 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (container_memory_working_set_bytes{image!="",name=~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}) - by (pod) - interval: 10s - intervalFactor: 1 - legendFormat: "{{ pod }}" - metric: container_memory_usage:sort_desc - refId: A - step: 10 - timeFrom: - timeShift: - title: Pods memory usage - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: short 
- label: - logBase: 1 - max: - min: - show: false - title: Pods memory usage - - collapse: true - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 26 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (container_memory_working_set_bytes{systemd_service_name!="",kubernetes_io_hostname=~"^$Node$"}) - by (systemd_service_name) - interval: 10s - intervalFactor: 1 - legendFormat: "{{ systemd_service_name }}" - metric: container_memory_usage:sort_desc - refId: A - step: 10 - timeFrom: - timeShift: - title: System services memory usage - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: System services memory usage - - collapse: true - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 27 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: 
true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (container_memory_working_set_bytes{image!="",name=~"^k8s_.*",container!="POD",kubernetes_io_hostname=~"^$Node$"}) - by (container, pod) - interval: 10s - intervalFactor: 1 - legendFormat: 'pod: {{ pod }} | {{ container }}' - metric: container_memory_usage:sort_desc - refId: A - step: 10 - - expr: sum (container_memory_working_set_bytes{image!="",name!~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}) - by (kubernetes_io_hostname, name, image) - interval: 10s - intervalFactor: 1 - legendFormat: 'docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})' - metric: container_memory_usage:sort_desc - refId: B - step: 10 - - expr: sum (container_memory_working_set_bytes{rkt_container_name!="",kubernetes_io_hostname=~"^$Node$"}) - by (kubernetes_io_hostname, rkt_container_name) - interval: 10s - intervalFactor: 1 - legendFormat: 'rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}' - metric: container_memory_usage:sort_desc - refId: C - step: 10 - timeFrom: - timeShift: - title: Containers memory usage - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: Containers memory usage - - collapse: true - editable: true - height: 500px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 28 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: false - 
show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (container_memory_working_set_bytes{id!="/",kubernetes_io_hostname=~"^$Node$"}) - by (id) - interval: 10s - intervalFactor: 1 - legendFormat: "{{ id }}" - metric: container_memory_usage:sort_desc - refId: A - step: 10 - timeFrom: - timeShift: - title: All processes memory usage - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: All processes memory usage - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 16 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: false - targets: - - expr: sum (rate (container_network_receive_bytes_total{image!="",name=~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (pod) - interval: 10s - intervalFactor: 1 - legendFormat: "-> {{ pod }}" - metric: network - refId: A - step: 10 - - expr: '- sum (rate 
(container_network_transmit_bytes_total{image!="",name=~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (pod)' - interval: 10s - intervalFactor: 1 - legendFormat: "<- {{ pod }}" - metric: network - refId: B - step: 10 - timeFrom: - timeShift: - title: Pods network I/O (5m avg) - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: Bps - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: Pods network I/O - - collapse: true - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 30 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: false - targets: - - expr: sum (rate (container_network_receive_bytes_total{image!="",name=~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (container, pod) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "-> pod: {{ pod }} | {{ container }}" - metric: network - refId: B - step: 10 - - expr: '- sum (rate (container_network_transmit_bytes_total{image!="",name=~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (container, pod)' - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "<- pod: {{ pod }} | {{ container }}" - metric: network - refId: D - step: 10 - - expr: sum (rate 
(container_network_receive_bytes_total{image!="",name!~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (kubernetes_io_hostname, name, image) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "-> docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name - }})" - metric: network - refId: A - step: 10 - - expr: '- sum (rate (container_network_transmit_bytes_total{image!="",name!~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (kubernetes_io_hostname, name, image)' - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "<- docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name - }})" - metric: network - refId: C - step: 10 - - expr: sum (rate (container_network_transmit_bytes_total{rkt_container_name!="",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (kubernetes_io_hostname, rkt_container_name) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "-> rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name - }}" - metric: network - refId: E - step: 10 - - expr: '- sum (rate (container_network_transmit_bytes_total{rkt_container_name!="",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (kubernetes_io_hostname, rkt_container_name)' - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "<- rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name - }}" - metric: network - refId: F - step: 10 - timeFrom: - timeShift: - title: Containers network I/O (5m avg) - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: Bps - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: Containers network I/O - - collapse: true - editable: true - height: 500px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - 
threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 29 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: false - show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: false - targets: - - expr: sum (rate (container_network_receive_bytes_total{id!="/",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (id) - interval: 10s - intervalFactor: 1 - legendFormat: "-> {{ id }}" - metric: network - refId: A - step: 10 - - expr: '- sum (rate (container_network_transmit_bytes_total{id!="/",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (id)' - interval: 10s - intervalFactor: 1 - legendFormat: "<- {{ id }}" - metric: network - refId: B - step: 10 - timeFrom: - timeShift: - title: All processes network I/O (5m avg) - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: Bps - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: All processes network I/O - time: - from: now-5m - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: ".*" - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: true - multi: false - name: Node - options: [] - query: label_values(kubernetes_io_hostname) - refresh: 1 - type: query - annotations: - list: [] - refresh: 
5m - schemaVersion: 12 - version: 13 - links: [] - gnetId: 315 + containers: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "3.1.1" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.3.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Monitors Kubernetes cluster using Prometheus. Shows overall cluster CPU / Memory / Filesystem usage as well as individual pod, containers, systemd services statistics. 
Uses cAdvisor metrics only.", + "overwrite": true, + "editable": false, + "gnetId": 315, + "graphTooltip": 0, + "id": 32, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 33, + "panels": [], + "title": "Network I/O pressure", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 5, + "w": 24, + "x": 0, + "y": 1 + }, + "height": "200px", + "id": 32, + "isNew": true, + "legend": { + "alignAsTable": false, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": false, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum (rate (container_network_receive_bytes_total{kubernetes_io_hostname=~\"^$Node$\"}[5m]))", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "Received", + "metric": "network", + "refId": "A", + "step": 10 + }, + { + "expr": "- sum (rate (container_network_transmit_bytes_total{kubernetes_io_hostname=~\"^$Node$\"}[5m]))", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "Sent", + "metric": "network", + "refId": "B", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Network I/O pressure", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ 
+ { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 6 + }, + "id": 34, + "panels": [], + "title": "Total usage", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 8, + "x": 0, + "y": 7 + }, + "height": "180px", + "id": 4, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (container_memory_working_set_bytes{id=\"/\",kubernetes_io_hostname=~\"^$Node$\"}) / sum (machine_memory_bytes{kubernetes_io_hostname=~\"^$Node$\"}) * 100", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "65, 90", + "title": "Cluster memory usage", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + 
} + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 8, + "x": 8, + "y": 7 + }, + "height": "180px", + "id": 6, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (rate (container_cpu_usage_seconds_total{id=\"/\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) / sum (machine_cpu_cores{kubernetes_io_hostname=~\"^$Node$\"}) * 100", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "65, 90", + "title": "Cluster CPU usage (5m avg)", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "percent", + "gauge": { + "maxValue": 100, + 
"minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 8, + "x": 16, + "y": 7 + }, + "height": "180px", + "id": 7, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (container_fs_usage_bytes{device=~\"^/dev/[sv]da[0-9]$\",id=~\"/.+\",kubernetes_io_hostname=~\"^$Node$\"}) / sum (container_fs_limit_bytes{device=~\"^/dev/[sv]da[0-9]$\",id=~\"/.+\",kubernetes_io_hostname=~\"^$Node$\"}) * 100", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": "65, 90", + "title": "Cluster filesystem usage", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "bytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 0, + "y": 12 + }, + "height": "1px", + "id": 9, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": 
[ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "20%", + "prefix": "", + "prefixFontSize": "20%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (container_memory_working_set_bytes{id=\"/\",kubernetes_io_hostname=~\"^$Node$\"})", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "", + "title": "Used", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "bytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 4, + "y": 12 + }, + "height": "1px", + "id": 10, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", 
+ "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (machine_memory_bytes{kubernetes_io_hostname=~\"^$Node$\"})", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "", + "title": "Total", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 8, + "y": 12 + }, + "height": "1px", + "id": 11, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": " cores", + "postfixFontSize": "30%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (rate (container_cpu_usage_seconds_total{id=\"/\",kubernetes_io_hostname=~\"^$Node$\"}[5m]))", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "", + "title": "Used", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + 
"colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 12, + "y": 12 + }, + "height": "1px", + "id": 12, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": " cores", + "postfixFontSize": "30%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (machine_cpu_cores{kubernetes_io_hostname=~\"^$Node$\"})", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "", + "title": "Total", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "bytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 16, + "y": 12 + }, + "height": "1px", + "id": 13, + "interval": 
null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (container_fs_usage_bytes{device=~\"^/dev/[sv]da[0-9]$\",id=~\"/.+\",kubernetes_io_hostname=~\"^$Node$\"})", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "", + "title": "Used", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "bytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 20, + "y": 12 + }, + "height": "1px", + "id": 14, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + 
"sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (container_fs_limit_bytes{device=~\"^/dev/[sv]da[0-9]$\",id=~\"/.+\",kubernetes_io_hostname=~\"^$Node$\"})", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "", + "title": "Total", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 15 + }, + "id": 35, + "panels": [], + "title": "Pods CPU usage", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 3, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 16 + }, + "height": "", + "id": 17, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "sum (rate (container_cpu_usage_seconds_total{image!=\"\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (pod)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "{{ pod }}", + "metric": "container_cpu", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Pods CPU usage (5m avg)", + "tooltip": { + "msResolution": true, + "shared": true, + 
"sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "cores", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": true, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 23 + }, + "id": 36, + "panels": [ + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 3, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 23 + }, + "height": "", + "id": 24, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": null, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "sum (rate (container_cpu_usage_seconds_total{image!=\"\",name=~\"^k8s_.*\",container!=\"POD\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (container, pod)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "pod: {{ pod }} | {{ container }}", + "metric": "container_cpu", + "refId": "A", + "step": 10 + }, + { + "expr": "sum (rate (container_cpu_usage_seconds_total{image!=\"\",name!~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (kubernetes_io_hostname, name, image)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "docker: {{ 
kubernetes_io_hostname }} | {{ image }} ({{ name }})", + "metric": "container_cpu", + "refId": "B", + "step": 10 + }, + { + "expr": "sum (rate (container_cpu_usage_seconds_total{rkt_container_name!=\"\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (kubernetes_io_hostname, rkt_container_name)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}", + "metric": "container_cpu", + "refId": "C", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Containers CPU usage (5m avg)", + "tooltip": { + "msResolution": true, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "show": true + }, + "yaxes": [ + { + "format": "none", + "label": "cores", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + } + ], + "title": "Containers CPU usage", + "type": "row" + }, + { + "collapsed": true, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 24 + }, + "id": 37, + "panels": [ + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 3, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 13, + "w": 24, + "x": 0, + "y": 24 + }, + "id": 20, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "sum (rate (container_cpu_usage_seconds_total{id!=\"/\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by 
(id)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "{{ id }}", + "metric": "container_cpu", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "All processes CPU usage (5m avg)", + "tooltip": { + "msResolution": true, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "show": true + }, + "yaxes": [ + { + "format": "none", + "label": "cores", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + } + ], + "repeat": null, + "title": "All processes CPU usage", + "type": "row" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 25 + }, + "id": 38, + "panels": [], + "title": "Pods memory usage", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 26 + }, + "id": 25, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "sum (container_memory_working_set_bytes{image!=\"\",kubernetes_io_hostname=~\"^$Node$\"}) by (pod)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "{{ pod }}", + "metric": "container_memory_usage:sort_desc", + "refId": "A", + "step": 
10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Pods memory usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": true, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 33 + }, + "id": 39, + "panels": [ + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 33 + }, + "id": 27, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "sum (container_memory_working_set_bytes{image!=\"\",name=~\"^k8s_.*\",container!=\"POD\",kubernetes_io_hostname=~\"^$Node$\"}) by (container, pod)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "pod: {{ pod }} | {{ container }}", + "metric": "container_memory_usage:sort_desc", + "refId": "A", + "step": 10 + }, + { + "expr": "sum (container_memory_working_set_bytes{image!=\"\",name!~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\"}) by (kubernetes_io_hostname, name, 
image)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})", + "metric": "container_memory_usage:sort_desc", + "refId": "B", + "step": 10 + }, + { + "expr": "sum (container_memory_working_set_bytes{rkt_container_name!=\"\",kubernetes_io_hostname=~\"^$Node$\"}) by (kubernetes_io_hostname, rkt_container_name)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}", + "metric": "container_memory_usage:sort_desc", + "refId": "C", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Containers memory usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "show": true + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + } + ], + "title": "Containers memory usage", + "type": "row" + }, + { + "collapsed": true, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 34 + }, + "id": 40, + "panels": [ + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 13, + "w": 24, + "x": 0, + "y": 34 + }, + "id": 28, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "stack": false, + "steppedLine": true, + 
"targets": [ + { + "expr": "sum (container_memory_working_set_bytes{id!=\"/\",kubernetes_io_hostname=~\"^$Node$\"}) by (id)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "{{ id }}", + "metric": "container_memory_usage:sort_desc", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "All processes memory usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "show": true + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + } + ], + "title": "All processes memory usage", + "type": "row" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 35 + }, + "id": 41, + "panels": [], + "title": "Pods network I/O", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 36 + }, + "id": 16, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum (rate (container_network_receive_bytes_total{image!=\"\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (pod)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "-> {{ pod }}", + "metric": 
"network", + "refId": "A", + "step": 10 + }, + { + "expr": "- sum (rate (container_network_transmit_bytes_total{image!=\"\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (pod)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "<- {{ pod }}", + "metric": "network", + "refId": "B", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Pods network I/O (5m avg)", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "show": true + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + }, + { + "collapsed": true, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 43 + }, + "id": 42, + "panels": [ + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 43 + }, + "id": 30, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum (rate (container_network_receive_bytes_total{image!=\"\",name=~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (container, pod)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "-> pod: {{ pod }} | {{ container }}", + "metric": "network", + "refId": "B", + "step": 10 + }, + 
{ + "expr": "- sum (rate (container_network_transmit_bytes_total{image!=\"\",name=~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (container, pod)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "<- pod: {{ pod }} | {{ container }}", + "metric": "network", + "refId": "D", + "step": 10 + }, + { + "expr": "sum (rate (container_network_receive_bytes_total{image!=\"\",name!~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (kubernetes_io_hostname, name, image)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "-> docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})", + "metric": "network", + "refId": "A", + "step": 10 + }, + { + "expr": "- sum (rate (container_network_transmit_bytes_total{image!=\"\",name!~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (kubernetes_io_hostname, name, image)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "<- docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})", + "metric": "network", + "refId": "C", + "step": 10 + }, + { + "expr": "sum (rate (container_network_transmit_bytes_total{rkt_container_name!=\"\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (kubernetes_io_hostname, rkt_container_name)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "-> rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}", + "metric": "network", + "refId": "E", + "step": 10 + }, + { + "expr": "- sum (rate (container_network_transmit_bytes_total{rkt_container_name!=\"\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (kubernetes_io_hostname, rkt_container_name)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "<- rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}", + "metric": "network", + "refId": "F", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Containers network I/O (5m avg)", + 
"tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "show": true + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + } + ], + "title": "Containers network I/O", + "type": "row" + }, + { + "collapsed": true, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 44 + }, + "id": 43, + "panels": [ + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 13, + "w": 24, + "x": 0, + "y": 44 + }, + "id": 29, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum (rate (container_network_receive_bytes_total{id!=\"/\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (id)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "-> {{ id }}", + "metric": "network", + "refId": "A", + "step": 10 + }, + { + "expr": "- sum (rate (container_network_transmit_bytes_total{id!=\"/\",kubernetes_io_hostname=~\"^$Node$\"}[5m])) by (id)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "<- {{ id }}", + "metric": "network", + "refId": "B", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "All processes network I/O (5m avg)", + "tooltip": { + "msResolution": false, + "shared": 
true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "show": true + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + } + ], + "title": "All processes network I/O", + "type": "row" + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "kubernetes" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": ".*", + "current": { + "text": "All", + "value": "$__all" + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": true, + "label": null, + "multi": false, + "name": "Node", + "options": [], + "query": "label_values(kubernetes_io_hostname)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-5m", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "Container Metrics (cAdvisor)", + "version": 1 + } \ No newline at end of file diff --git a/grafana/values_overrides/coredns.yaml b/grafana/values_overrides/coredns.yaml index 009b6f806..ba37d3897 100644 --- a/grafana/values_overrides/coredns.yaml +++ b/grafana/values_overrides/coredns.yaml @@ -2,1015 +2,1378 @@ # CoreDNS conf: dashboards: - coredns: - 
__inputs: - - name: prometheus - label: Prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.4.3 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - annotations: - list: [] - editable: true - gnetId: 5926 - graphTooltip: 0 - hideControls: false - id: - links: [] - rows: - - collapse: false - height: 250px - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 1 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: total - yaxis: 2 - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m])) - by (proto) - format: time_series - intervalFactor: 2 - legendFormat: "{{proto}}" - refId: A - step: 60 - - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m])) - format: time_series - intervalFactor: 2 - legendFormat: total - refId: B - step: 60 - thresholds: [] - timeFrom: - timeShift: - title: Requests (total) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: pps - logBase: 1 - max: - min: 0 - show: true - - format: pps - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 12 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: 
false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: total - yaxis: 2 - - alias: other - yaxis: 2 - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(rate(coredns_dns_request_type_count_total{instance=~"$instance"}[5m])) - by (type) - intervalFactor: 2 - legendFormat: "{{type}}" - refId: A - step: 60 - thresholds: [] - timeFrom: - timeShift: - title: Requests (by qtype) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: pps - logBase: 1 - max: - min: 0 - show: true - - format: pps - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 2 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: total - yaxis: 2 - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m])) - by (zone) - intervalFactor: 2 - legendFormat: "{{zone}}" - refId: A - step: 60 - - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m])) - intervalFactor: 2 - legendFormat: total - refId: B - step: 60 - thresholds: [] - timeFrom: - timeShift: - title: Requests (by zone) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: pps - logBase: 1 - max: - min: 0 - show: true - - format: pps - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: 
false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 10 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: total - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(rate(coredns_dns_request_do_count_total{instance=~"$instance"}[5m])) - intervalFactor: 2 - legendFormat: DO - refId: A - step: 40 - - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m])) - intervalFactor: 2 - legendFormat: total - refId: B - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Requests (DO bit) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: pps - logBase: 1 - max: - min: 0 - show: true - - format: pps - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 9 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: tcp:90 - yaxis: 2 - - alias: 'tcp:99 ' - yaxis: 2 - - alias: tcp:50 - yaxis: 2 - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: histogram_quantile(0.99, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m])) - by (le,proto)) - intervalFactor: 2 - legendFormat: "{{proto}}:99 " - refId: A - step: 60 - - expr: histogram_quantile(0.90, 
sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m])) - by (le,proto)) - intervalFactor: 2 - legendFormat: "{{proto}}:90" - refId: B - step: 60 - - expr: histogram_quantile(0.50, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m])) - by (le,proto)) - intervalFactor: 2 - legendFormat: "{{proto}}:50" - refId: C - step: 60 - thresholds: [] - timeFrom: - timeShift: - title: Requests (size, udp) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 14 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: tcp:90 - yaxis: 1 - - alias: 'tcp:99 ' - yaxis: 1 - - alias: tcp:50 - yaxis: 1 - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: histogram_quantile(0.99, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m])) - by (le,proto)) - intervalFactor: 2 - legendFormat: "{{proto}}:99 " - refId: A - step: 60 - - expr: histogram_quantile(0.90, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m])) - by (le,proto)) - intervalFactor: 2 - legendFormat: "{{proto}}:90" - refId: B - step: 60 - - expr: histogram_quantile(0.50, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m])) - by (le,proto)) - intervalFactor: 2 - legendFormat: "{{proto}}:50" - refId: C - step: 60 - thresholds: [] - timeFrom: - 
timeShift: - title: Requests (size,tcp) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: 0 - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Row - titleSize: h6 - - collapse: false - height: 250px - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 5 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(rate(coredns_dns_response_rcode_count_total{instance=~"$instance"}[5m])) - by (rcode) - intervalFactor: 2 - legendFormat: "{{rcode}}" - refId: A - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Responses (by rcode) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: pps - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 3 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: 
histogram_quantile(0.99, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~"$instance"}[5m])) - by (le, job)) - intervalFactor: 2 - legendFormat: 99% - refId: A - step: 40 - - expr: histogram_quantile(0.90, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~"$instance"}[5m])) - by (le)) - intervalFactor: 2 - legendFormat: 90% - refId: B - step: 40 - - expr: histogram_quantile(0.50, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~"$instance"}[5m])) - by (le)) - intervalFactor: 2 - legendFormat: 50% - refId: C - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Responses (duration) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 8 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: udp:50% - yaxis: 1 - - alias: tcp:50% - yaxis: 2 - - alias: tcp:90% - yaxis: 2 - - alias: tcp:99% - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: 'histogram_quantile(0.99, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m])) - by (le,proto)) ' - intervalFactor: 2 - legendFormat: "{{proto}}:99%" - refId: A - step: 40 - - expr: 'histogram_quantile(0.90, sum(rate(coredns_dns_response_size_bytes_bucket{instance="$instance",proto="udp"}[5m])) - by (le,proto)) ' - intervalFactor: 2 - legendFormat: "{{proto}}:90%" - refId: B - step: 40 - - expr: 'histogram_quantile(0.50, 
sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m])) - by (le,proto)) ' - intervalFactor: 2 - legendFormat: "{{proto}}:50%" - metric: '' - refId: C - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Responses (size, udp) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 13 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: udp:50% - yaxis: 1 - - alias: tcp:50% - yaxis: 1 - - alias: tcp:90% - yaxis: 1 - - alias: tcp:99% - yaxis: 1 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: 'histogram_quantile(0.99, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m])) - by (le,proto)) ' - intervalFactor: 2 - legendFormat: "{{proto}}:99%" - refId: A - step: 40 - - expr: 'histogram_quantile(0.90, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m])) - by (le,proto)) ' - intervalFactor: 2 - legendFormat: "{{proto}}:90%" - refId: B - step: 40 - - expr: 'histogram_quantile(0.50, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m])) - by (le, proto)) ' - intervalFactor: 2 - legendFormat: "{{proto}}:50%" - metric: '' - refId: C - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Responses (size, tcp) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: 
- mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: 0 - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 250px - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 15 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(coredns_cache_size{instance=~"$instance"}) by (type) - intervalFactor: 2 - legendFormat: "{{type}}" - refId: A - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Cache (size) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 16 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: misses - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(rate(coredns_cache_hits_total{instance=~"$instance"}[5m])) by (type) - intervalFactor: 2 - legendFormat: hits:{{type}} - refId: A - step: 40 - - expr: 
sum(rate(coredns_cache_misses_total{instance=~"$instance"}[5m])) by (type) - intervalFactor: 2 - legendFormat: misses - refId: B - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Cache (hitrate) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: pps - logBase: 1 - max: - min: 0 - show: true - - format: pps - logBase: 1 - max: - min: 0 - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - schemaVersion: 14 - style: dark - tags: - - dns - - coredns - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: ".*" - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: true - label: Instance - multi: false - name: instance - options: [] - query: up{job="coredns"} - refresh: 1 - regex: .*instance="(.*?)".* - sort: 0 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - time: - from: now-3h - to: now - timepicker: - now: true - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: utc - title: CoreDNS - version: 3 - description: A dashboard for the CoreDNS DNS server. 
+ coredns: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "4.4.3" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "A dashboard for the CoreDNS DNS server.", + "overwrite": true, + "editable": true, + "gnetId": 5926, + "graphTooltip": 0, + "id": 20, + "links": [], + "panels": [ + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 0 + }, + "id": 1, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "total", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(coredns_dns_request_count_total{instance=~\"$instance\"}[5m])) by (proto)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{proto}}", + "refId": "A", + "step": 60 + }, + { + "expr": "sum(rate(coredns_dns_request_count_total{instance=~\"$instance\"}[5m]))", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": 
"total", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Requests (total)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 0 + }, + "id": 12, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "total", + "yaxis": 2 + }, + { + "alias": "other", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(coredns_dns_request_type_count_total{instance=~\"$instance\"}[5m])) by (type)", + "intervalFactor": 2, + "legendFormat": "{{type}}", + "refId": "A", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Requests (by qtype)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + 
"format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 0 + }, + "id": 2, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "total", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(coredns_dns_request_count_total{instance=~\"$instance\"}[5m])) by (zone)", + "intervalFactor": 2, + "legendFormat": "{{zone}}", + "refId": "A", + "step": 60 + }, + { + "expr": "sum(rate(coredns_dns_request_count_total{instance=~\"$instance\"}[5m]))", + "intervalFactor": 2, + "legendFormat": "total", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Requests (by zone)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 
7, + "w": 12, + "x": 0, + "y": 7 + }, + "id": 10, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "total", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(coredns_dns_request_do_count_total{instance=~\"$instance\"}[5m]))", + "intervalFactor": 2, + "legendFormat": "DO", + "refId": "A", + "step": 40 + }, + { + "expr": "sum(rate(coredns_dns_request_count_total{instance=~\"$instance\"}[5m]))", + "intervalFactor": 2, + "legendFormat": "total", + "refId": "B", + "step": 40 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Requests (DO bit)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "pps", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 6, + "x": 12, + "y": 7 + }, + "id": 9, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + 
"renderer": "flot", + "seriesOverrides": [ + { + "alias": "tcp:90", + "yaxis": 2 + }, + { + "alias": "tcp:99 ", + "yaxis": 2 + }, + { + "alias": "tcp:50", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\"}[5m])) by (le,proto))", + "intervalFactor": 2, + "legendFormat": "{{proto}}:99 ", + "refId": "A", + "step": 60 + }, + { + "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\"}[5m])) by (le,proto))", + "intervalFactor": 2, + "legendFormat": "{{proto}}:90", + "refId": "B", + "step": 60 + }, + { + "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\"}[5m])) by (le,proto))", + "intervalFactor": 2, + "legendFormat": "{{proto}}:50", + "refId": "C", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Requests (size, udp)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 7 + }, + "id": 14, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + 
"nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "tcp:90", + "yaxis": 1 + }, + { + "alias": "tcp:99 ", + "yaxis": 1 + }, + { + "alias": "tcp:50", + "yaxis": 1 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\"}[5m])) by (le,proto))", + "intervalFactor": 2, + "legendFormat": "{{proto}}:99 ", + "refId": "A", + "step": 60 + }, + { + "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\"}[5m])) by (le,proto))", + "intervalFactor": 2, + "legendFormat": "{{proto}}:90", + "refId": "B", + "step": 60 + }, + { + "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\"}[5m])) by (le,proto))", + "intervalFactor": 2, + "legendFormat": "{{proto}}:50", + "refId": "C", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Requests (size,tcp)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 14 + }, + "id": 5, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + 
"show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(coredns_dns_response_rcode_count_total{instance=~\"$instance\"}[5m])) by (rcode)", + "intervalFactor": 2, + "legendFormat": "{{rcode}}", + "refId": "A", + "step": 40 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Responses (by rcode)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 14 + }, + "id": 3, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~\"$instance\"}[5m])) by (le, job))", + "intervalFactor": 2, + "legendFormat": "99%", + "refId": "A", + 
"step": 40 + }, + { + "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~\"$instance\"}[5m])) by (le))", + "intervalFactor": 2, + "legendFormat": "90%", + "refId": "B", + "step": 40 + }, + { + "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~\"$instance\"}[5m])) by (le))", + "intervalFactor": 2, + "legendFormat": "50%", + "refId": "C", + "step": 40 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Responses (duration)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 21 + }, + "id": 8, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "udp:50%", + "yaxis": 1 + }, + { + "alias": "tcp:50%", + "yaxis": 2 + }, + { + "alias": "tcp:90%", + "yaxis": 2 + }, + { + "alias": "tcp:99%", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "histogram_quantile(0.99, 
sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\"}[5m])) by (le,proto)) ", + "intervalFactor": 2, + "legendFormat": "{{proto}}:99%", + "refId": "A", + "step": 40 + }, + { + "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\"}[5m])) by (le,proto)) ", + "intervalFactor": 2, + "legendFormat": "{{proto}}:90%", + "refId": "B", + "step": 40 + }, + { + "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\"}[5m])) by (le,proto)) ", + "intervalFactor": 2, + "legendFormat": "{{proto}}:50%", + "metric": "", + "refId": "C", + "step": 40 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Responses (size, udp)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 21 + }, + "id": 13, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "udp:50%", + "yaxis": 1 + }, + { + "alias": "tcp:50%", + "yaxis": 1 + }, + { + "alias": "tcp:90%", + 
"yaxis": 1 + }, + { + "alias": "tcp:99%", + "yaxis": 1 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\"}[5m])) by (le,proto)) ", + "intervalFactor": 2, + "legendFormat": "{{proto}}:99%", + "refId": "A", + "step": 40 + }, + { + "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\"}[5m])) by (le,proto)) ", + "intervalFactor": 2, + "legendFormat": "{{proto}}:90%", + "refId": "B", + "step": 40 + }, + { + "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\"}[5m])) by (le, proto)) ", + "intervalFactor": 2, + "legendFormat": "{{proto}}:50%", + "metric": "", + "refId": "C", + "step": 40 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Responses (size, tcp)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 28 + }, + "id": 15, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 
5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(coredns_cache_size{instance=~\"$instance\"}) by (type)", + "intervalFactor": 2, + "legendFormat": "{{type}}", + "refId": "A", + "step": 40 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cache (size)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 28 + }, + "id": 16, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "misses", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(coredns_cache_hits_total{instance=~\"$instance\"}[5m])) by (type)", + "intervalFactor": 2, + "legendFormat": "hits:{{type}}", + "refId": "A", + "step": 40 + }, + { + "expr": "sum(rate(coredns_cache_misses_total{instance=~\"$instance\"}[5m])) by (type)", + "intervalFactor": 2, + "legendFormat": "misses", + "refId": "B", + "step": 40 + } + ], + "thresholds": [], + 
"timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cache (hitrate)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "schemaVersion": 18, + "style": "dark", + "tags": [ + "dns", + "coredns" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": ".*", + "current": { + "text": "All", + "value": "$__all" + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": true, + "label": "Instance", + "multi": false, + "name": "instance", + "options": [], + "query": "up{job=\"coredns\"}", + "refresh": 1, + "regex": ".*instance=\"(.*?)\".*", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "now": true, + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "CoreDNS", + "version": 1 + } \ No newline at end of file diff --git a/grafana/values_overrides/elasticsearch.yaml b/grafana/values_overrides/elasticsearch.yaml index 8c1c31022..f7a317f41 100644 --- 
a/grafana/values_overrides/elasticsearch.yaml +++ b/grafana/values_overrides/elasticsearch.yaml @@ -2,2630 +2,3474 @@ # an Elasticsearch cluster conf: dashboards: - elasticsearch: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.6.3 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - annotations: - list: - - builtIn: 1 - datasource: "-- Grafana --" - enable: true - hide: true - iconColor: rgba(0, 211, 255, 1) - name: Annotations & Alerts - type: dashboard - editable: true - gnetId: 4358 - graphTooltip: 1 - hideControls: false - id: - links: [] - refresh: 5m - rows: - - collapse: false - height: - panels: - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(178, 49, 13, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 8 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 5 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: (sum(elasticsearch_cluster_health_status{cluster=~"$cluster",color="green"})*2)+sum(elasticsearch_cluster_health_status{cluster=~"$cluster",color="yellow"}) - format: time_series - intervalFactor: 3 - legendFormat: '' - metric: '' - refId: A 
- step: 40 - thresholds: '0,1,2' - title: Cluster health status - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: GREEN - value: '2' - - op: "=" - text: YELLOW - value: '1' - - op: "=" - text: RED - value: '0' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 10 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: sum(elasticsearch_cluster_health_number_of_nodes{cluster=~"$cluster"}) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - metric: '' - refId: A - step: 40 - thresholds: '' - title: Nodes - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 9 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected 
- nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_number_of_data_nodes{cluster="$cluster"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - metric: '' - refId: A - step: 40 - thresholds: '' - title: Data nodes - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - hideTimeOverride: true - id: 16 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_number_of_pending_tasks{cluster="$cluster"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - metric: '' - refId: A - step: 40 - thresholds: '' - title: Pending tasks - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Cluster - titleSize: h6 - - collapse: false - height: '' 
- panels: - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 11 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - minSpan: 2 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - repeat: shard_type - span: 2.4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_active_primary_shards{cluster="$cluster"} - intervalFactor: 2 - legendFormat: '' - refId: A - step: 40 - thresholds: '' - title: active primary shards - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 39 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - minSpan: 2 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2.4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - 
tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_active_shards{cluster="$cluster"} - intervalFactor: 2 - legendFormat: '' - refId: A - step: 40 - thresholds: '' - title: active shards - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 40 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - minSpan: 2 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2.4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_initializing_shards{cluster="$cluster"} - intervalFactor: 2 - legendFormat: '' - refId: A - step: 40 - thresholds: '' - title: initializing shards - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 41 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - minSpan: 2 - nullPointMode: 
connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2.4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_relocating_shards{cluster="$cluster"} - intervalFactor: 2 - legendFormat: '' - refId: A - step: 40 - thresholds: '' - title: relocating shards - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 42 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - minSpan: 2 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2.4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_unassigned_shards{cluster="$cluster"} - intervalFactor: 2 - legendFormat: '' - refId: A - step: 40 - thresholds: '' - title: unassigned shards - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Shards - titleSize: h6 - - collapse: false - height: - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - 
fill: 1 - grid: {} - height: '400' - id: 30 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: elasticsearch_process_cpu_percent{cluster="$cluster",es_master_node="true",name=~"$node"} - format: time_series - instant: false - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }} - master" - metric: '' - refId: A - step: 10 - - expr: elasticsearch_process_cpu_percent{cluster="$cluster",es_data_node="true",name=~"$node"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }} - data" - metric: '' - refId: B - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: CPU usage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: percent - label: CPU usage - logBase: 1 - max: 100 - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 0 - grid: {} - height: '400' - id: 31 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: 
elasticsearch_jvm_memory_used_bytes{cluster="$cluster",name=~"$node",name=~"$node"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }} - used: {{area}}" - metric: '' - refId: A - step: 10 - - expr: elasticsearch_jvm_memory_committed_bytes{cluster="$cluster",name=~"$node",name=~"$node"} - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - committed: {{area}}" - refId: B - step: 10 - - expr: elasticsearch_jvm_memory_max_bytes{cluster="$cluster",name=~"$node",name=~"$node"} - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - max: {{area}}" - refId: C - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: JVM memory usage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: Memory - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 32 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: 1-(elasticsearch_filesystem_data_available_bytes{cluster="$cluster"}/elasticsearch_filesystem_data_size_bytes{cluster="$cluster",name=~"$node"}) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }} - {{path}}" - metric: '' - refId: A - step: 10 - thresholds: - - colorMode: custom - fill: true - fillColor: rgba(216, 
200, 27, 0.27) - op: gt - value: 0.8 - - colorMode: custom - fill: true - fillColor: rgba(234, 112, 112, 0.22) - op: gt - value: 0.9 - timeFrom: - timeShift: - title: Disk usage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: percentunit - label: Disk Usage % - logBase: 1 - max: 1 - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 47 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - sort: max - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: sent - transform: negative-Y - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: irate(elasticsearch_transport_tx_size_bytes_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} -sent" - refId: D - step: 10 - - expr: irate(elasticsearch_transport_rx_size_bytes_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} -received" - refId: C - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Network usage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: Bps - label: Bytes/sec - logBase: 1 - max: - min: - show: true - - format: pps - label: '' - logBase: 1 - max: - min: - 
show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: System - titleSize: h6 - - collapse: false - height: '' - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 1 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: elasticsearch_indices_docs{cluster="$cluster",name=~"$node"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Documents count - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: Documents - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 24 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: 
irate(elasticsearch_indices_indexing_index_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Documents indexed rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: index calls/s - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 25 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: rate(elasticsearch_indices_docs_deleted{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Documents deleted rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: Documents/s - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - 
grid: {} - height: '400' - id: 26 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: rate(elasticsearch_indices_merges_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Documents merged rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: Documents/s - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Documents - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 48 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - sort: avg - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: irate(elasticsearch_indices_indexing_index_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - 
intervalFactor: 2 - legendFormat: "{{ name }} - indexing" - metric: '' - refId: A - step: 4 - - expr: irate(elasticsearch_indices_search_query_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - query" - refId: B - step: 4 - - expr: irate(elasticsearch_indices_search_fetch_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - fetch" - refId: C - step: 4 - - expr: irate(elasticsearch_indices_merges_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - merges" - refId: D - step: 4 - - expr: irate(elasticsearch_indices_refresh_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - refresh" - refId: E - step: 4 - - expr: irate(elasticsearch_indices_flush_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - flush" - refId: F - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: Total Operations rate - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: Operations/s - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 49 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - sort: avg - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 
5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: irate(elasticsearch_indices_indexing_index_time_seconds_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }} - indexing" - metric: '' - refId: A - step: 4 - - expr: irate(elasticsearch_indices_search_query_time_ms_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - query" - refId: B - step: 4 - - expr: irate(elasticsearch_indices_search_fetch_time_ms_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - fetch" - refId: C - step: 4 - - expr: irate(elasticsearch_indices_merges_total_time_ms_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - merges" - refId: D - step: 4 - - expr: irate(elasticsearch_indices_refresh_total_time_ms_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - refresh" - refId: E - step: 4 - - expr: irate(elasticsearch_indices_flush_time_ms_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - flush" - refId: F - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: Total Operations time - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: ms - label: Time - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Total Operations stats - titleSize: h6 - - collapse: false - height: '' - panels: - - 
aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 33 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: 'rate(elasticsearch_indices_search_query_time_seconds{cluster="$cluster",name=~"$node"}[$interval]) ' - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: Query time - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: ms - label: Time - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 5 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: rate(elasticsearch_indices_indexing_index_time_seconds_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: 
"{{name}}" - metric: '' - refId: A - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: Indexing time - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: ms - label: Time - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 3 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: rate(elasticsearch_indices_merges_total_time_seconds_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: Merging time - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: Time - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Times - titleSize: h6 - - collapse: false - height: - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 4 - legend: - alignAsTable: 
true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: elasticsearch_indices_fielddata_memory_size_bytes{cluster="$cluster",name=~"$node"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Field data memory size - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: Memory - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 34 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: rate(elasticsearch_indices_fielddata_evictions{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Field data evictions - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: 
false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: Evictions/s - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 35 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: elasticsearch_indices_query_cache_memory_size_bytes{cluster="$cluster",name=~"$node"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Query cache size - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: Size - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 36 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 
3 - stack: true - steppedLine: false - targets: - - expr: rate(elasticsearch_indices_query_cache_evictions{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Query cache evictions - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: Evictions/s - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Caches - titleSize: h6 - - collapse: false - height: 728 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 45 - legend: - alignAsTable: true - avg: true - current: false - max: true - min: true - show: true - sort: avg - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: ' irate(elasticsearch_thread_pool_rejected_count{cluster="$cluster",name=~"$node"}[$interval])' - format: time_series - intervalFactor: 2 - legendFormat: "{{name}} - {{ type }}" - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Thread Pool operations rejected - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false 
- dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 46 - legend: - alignAsTable: true - avg: true - current: false - max: true - min: true - show: true - sort: avg - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: elasticsearch_thread_pool_active_count{cluster="$cluster",name=~"$node"} - format: time_series - intervalFactor: 2 - legendFormat: "{{name}} - {{ type }}" - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Thread Pool operations queued - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - height: '' - id: 43 - legend: - alignAsTable: true - avg: true - current: false - max: true - min: true - show: true - sort: avg - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: elasticsearch_thread_pool_active_count{cluster="$cluster",name=~"$node"} - format: time_series - intervalFactor: 2 - legendFormat: "{{name}} - {{ type }}" - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Thread Pool threads active - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph 
- xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 44 - legend: - alignAsTable: true - avg: true - current: false - max: true - min: true - show: true - sort: avg - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: irate(elasticsearch_thread_pool_completed_count{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{name}} - {{ type }}" - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Thread Pool operations completed - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Thread Pool - titleSize: h6 - - collapse: false - height: - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 7 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - 
seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: true - steppedLine: false - targets: - - expr: rate(elasticsearch_jvm_gc_collection_seconds_count{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}} - {{gc}}" - metric: '' - refId: A - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: GC count - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: GCs - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 27 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: rate(elasticsearch_jvm_gc_collection_seconds_count{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}} - {{gc}}" - metric: '' - refId: A - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: GC time - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: Time - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: 
true - title: JVM Garbage Collection - titleSize: h6 - schemaVersion: 14 - style: dark - tags: - - elasticsearch - - App - templating: - list: - - auto: true - auto_count: 30 - auto_min: 10s - current: - text: auto - value: "$__auto_interval" - hide: 0 - label: Interval - name: interval - options: - - selected: true - text: auto - value: "$__auto_interval" - - selected: false - text: 1m - value: 1m - - selected: false - text: 10m - value: 10m - - selected: false - text: 30m - value: 30m - - selected: false - text: 1h - value: 1h - - selected: false - text: 6h - value: 6h - - selected: false - text: 12h - value: 12h - - selected: false - text: 1d - value: 1d - - selected: false - text: 7d - value: 7d - - selected: false - text: 14d - value: 14d - - selected: false - text: 30d - value: 30d - query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d - refresh: 2 - type: interval - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: Instance - multi: false - name: cluster - options: [] - query: label_values(elasticsearch_cluster_health_status,cluster) - refresh: 1 - regex: '' - sort: 1 - tagValuesQuery: - tags: [] - tagsQuery: - type: query - useTags: false - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: true - label: node - multi: true - name: node - options: [] - query: label_values(elasticsearch_process_cpu_percent,name) - refresh: 1 - regex: '' - sort: 1 - tagValuesQuery: - tags: [] - tagsQuery: - type: query - useTags: false - time: - from: now-12h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: browser - title: Elasticsearch - version: 1 - 
description: Elasticsearch detailed dashboard + elasticsearch: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "4.6.3" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Elasticsearch detailed dashboard", + "overwrite": true, + "editable": true, + "gnetId": 4358, + "graphTooltip": 1, + "id": 23, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 50, + "panels": [], + "repeat": null, + "title": "Cluster", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(178, 49, 13, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 10, + "x": 0, + "y": 1 + }, + "height": "50", + "id": 8, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + 
"postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "(sum(elasticsearch_cluster_health_status{cluster=~\"$cluster\",color=\"green\"})*2)+sum(elasticsearch_cluster_health_status{cluster=~\"$cluster\",color=\"yellow\"})", + "format": "time_series", + "intervalFactor": 3, + "legendFormat": "", + "metric": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "0,1,2", + "title": "Cluster health status", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "GREEN", + "value": "2" + }, + { + "op": "=", + "text": "YELLOW", + "value": "1" + }, + { + "op": "=", + "text": "RED", + "value": "0" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 10, + "y": 1 + }, + "height": "50", + "id": 10, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", 
+ "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(elasticsearch_cluster_health_number_of_nodes{cluster=~\"$cluster\"})", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "metric": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "Nodes", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 14, + "y": 1 + }, + "height": "50", + "id": 9, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_number_of_data_nodes{cluster=\"$cluster\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "metric": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "Data nodes", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + 
"valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 6, + "x": 18, + "y": 1 + }, + "height": "50", + "hideTimeOverride": true, + "id": 16, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_number_of_pending_tasks{cluster=\"$cluster\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "metric": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "Pending tasks", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 4 + }, + "id": 51, + "panels": [], + "repeat": null, + "title": "Shards", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + 
"editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 0, + "y": 5 + }, + "height": "50", + "id": 11, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "maxPerRow": 6, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "repeat": "shard_type", + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_active_primary_shards{cluster=\"$cluster\"}", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "active primary shards", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 4, + "y": 5 + }, + "height": "50", + "id": 39, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 
100, + "maxPerRow": 6, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_active_shards{cluster=\"$cluster\"}", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "active shards", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 8, + "y": 5 + }, + "height": "50", + "id": 40, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "maxPerRow": 6, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": 
"elasticsearch_cluster_health_initializing_shards{cluster=\"$cluster\"}", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "initializing shards", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 12, + "y": 5 + }, + "height": "50", + "id": 41, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "maxPerRow": 6, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_relocating_shards{cluster=\"$cluster\"}", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "relocating shards", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 
129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 16, + "y": 5 + }, + "height": "50", + "id": 42, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "maxPerRow": 6, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_unassigned_shards{cluster=\"$cluster\"}", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "unassigned shards", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 8 + }, + "id": 52, + "panels": [], + "repeat": null, + "title": "System", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 0, + "y": 9 + }, + "height": "400", + "id": 30, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + 
"sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_process_cpu_percent{cluster=\"$cluster\",es_master_node=\"true\",name=~\"$node\"}", + "format": "time_series", + "instant": false, + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }} - master", + "metric": "", + "refId": "A", + "step": 10 + }, + { + "expr": "elasticsearch_process_cpu_percent{cluster=\"$cluster\",es_data_node=\"true\",name=~\"$node\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }} - data", + "metric": "", + "refId": "B", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "CPU usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "percent", + "label": "CPU usage", + "logBase": 1, + "max": 100, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 6, + "y": 9 + }, + "height": "400", + "id": 31, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + 
"sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_jvm_memory_used_bytes{cluster=\"$cluster\",name=~\"$node\",name=~\"$node\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }} - used: {{area}}", + "metric": "", + "refId": "A", + "step": 10 + }, + { + "expr": "elasticsearch_jvm_memory_committed_bytes{cluster=\"$cluster\",name=~\"$node\",name=~\"$node\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - committed: {{area}}", + "refId": "B", + "step": 10 + }, + { + "expr": "elasticsearch_jvm_memory_max_bytes{cluster=\"$cluster\",name=~\"$node\",name=~\"$node\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - max: {{area}}", + "refId": "C", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "JVM memory usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": "Memory", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 12, + "y": 9 + }, + "height": 
"400", + "id": 32, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "1-(elasticsearch_filesystem_data_available_bytes{cluster=\"$cluster\"}/elasticsearch_filesystem_data_size_bytes{cluster=\"$cluster\",name=~\"$node\"})", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }} - {{path}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [ + { + "colorMode": "custom", + "fill": true, + "fillColor": "rgba(216, 200, 27, 0.27)", + "op": "gt", + "value": 0.8 + }, + { + "colorMode": "custom", + "fill": true, + "fillColor": "rgba(234, 112, 112, 0.22)", + "op": "gt", + "value": 0.9 + } + ], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Disk usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "percentunit", + "label": "Disk Usage %", + "logBase": 1, + "max": 1, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 18, + "y": 9 + }, + 
"height": "400", + "id": 47, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "sort": "max", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "sent", + "transform": "negative-Y" + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "irate(elasticsearch_transport_tx_size_bytes_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} -sent", + "refId": "D", + "step": 10 + }, + { + "expr": "irate(elasticsearch_transport_rx_size_bytes_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} -received", + "refId": "C", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Network usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": "Bytes/sec", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "pps", + "label": "", + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 19 + }, + "id": 53, + "panels": [], + "repeat": null, + "title": "Documents", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + 
"dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 0, + "y": 20 + }, + "height": "400", + "id": 1, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_indices_docs{cluster=\"$cluster\",name=~\"$node\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Documents count", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "Documents", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 6, + "y": 20 + }, + "height": "400", + "id": 24, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + 
"min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "irate(elasticsearch_indices_indexing_index_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Documents indexed rate", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "index calls/s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 12, + "y": 20 + }, + "height": "400", + "id": 25, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": 
[], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_docs_deleted{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Documents deleted rate", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "Documents/s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 18, + "y": 20 + }, + "height": "400", + "id": 26, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_merges_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + 
"refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Documents merged rate", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "Documents/s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 30 + }, + "id": 54, + "panels": [], + "repeat": null, + "title": "Total Operations stats", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 12, + "x": 0, + "y": 31 + }, + "height": "400", + "id": 48, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "irate(elasticsearch_indices_indexing_index_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }} - indexing", + "metric": "", + "refId": "A", + "step": 4 + }, + { + "expr": 
"irate(elasticsearch_indices_search_query_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - query", + "refId": "B", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_search_fetch_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - fetch", + "refId": "C", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_merges_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - merges", + "refId": "D", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_refresh_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - refresh", + "refId": "E", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_flush_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - flush", + "refId": "F", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Total Operations rate", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "Operations/s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + 
"gridPos": { + "h": 10, + "w": 12, + "x": 12, + "y": 31 + }, + "height": "400", + "id": 49, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "irate(elasticsearch_indices_indexing_index_time_seconds_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }} - indexing", + "metric": "", + "refId": "A", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_search_query_time_ms_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - query", + "refId": "B", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_search_fetch_time_ms_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - fetch", + "refId": "C", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_merges_total_time_ms_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - merges", + "refId": "D", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_refresh_total_time_ms_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - refresh", + "refId": "E", + "step": 4 + }, + { + "expr": 
"irate(elasticsearch_indices_flush_time_ms_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - flush", + "refId": "F", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Total Operations time", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "ms", + "label": "Time", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 41 + }, + "id": 55, + "panels": [], + "repeat": null, + "title": "Times", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 8, + "x": 0, + "y": 42 + }, + "height": "400", + "id": 33, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_search_query_time_seconds{cluster=\"$cluster\",name=~\"$node\"}[$interval]) ", + "format": "time_series", + "interval": "", + 
"intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Query time", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "ms", + "label": "Time", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 8, + "x": 8, + "y": 42 + }, + "height": "400", + "id": 5, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_indexing_index_time_seconds_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Indexing time", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + 
"show": true, + "values": [] + }, + "yaxes": [ + { + "format": "ms", + "label": "Time", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 8, + "x": 16, + "y": 42 + }, + "height": "400", + "id": 3, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_merges_total_time_seconds_total{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Merging time", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": "Time", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 52 + }, + "id": 56, + "panels": [], + 
"repeat": null, + "title": "Caches", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 0, + "y": 53 + }, + "height": "400", + "id": 4, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_indices_fielddata_memory_size_bytes{cluster=\"$cluster\",name=~\"$node\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Field data memory size", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": "Memory", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 6, + "y": 53 + }, + "height": "400", + "id": 34, + "legend": { + "alignAsTable": true, + "avg": true, + 
"current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_fielddata_evictions{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Field data evictions", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "Evictions/s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 12, + "y": 53 + }, + "height": "400", + "id": 35, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + 
"spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_indices_query_cache_memory_size_bytes{cluster=\"$cluster\",name=~\"$node\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Query cache size", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": "Size", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 18, + "y": 53 + }, + "height": "400", + "id": 36, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_query_cache_evictions{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": 
null, + "title": "Query cache evictions", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "Evictions/s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 63 + }, + "id": 57, + "panels": [], + "repeat": null, + "title": "Thread Pool", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 19, + "w": 6, + "x": 0, + "y": 64 + }, + "id": 45, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": true, + "min": true, + "show": true, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": " irate(elasticsearch_thread_pool_rejected_count{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{name}} - {{ type }}", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Thread Pool operations rejected", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + 
"yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 19, + "w": 6, + "x": 6, + "y": 64 + }, + "id": 46, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": true, + "min": true, + "show": true, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_thread_pool_active_count{cluster=\"$cluster\",name=~\"$node\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{name}} - {{ type }}", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Thread Pool operations queued", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 19, + "w": 6, + "x": 12, + "y": 64 + }, + "height": "", + 
"id": 43, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": true, + "min": true, + "show": true, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_thread_pool_active_count{cluster=\"$cluster\",name=~\"$node\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{name}} - {{ type }}", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Thread Pool threads active", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 19, + "w": 6, + "x": 18, + "y": 64 + }, + "id": 44, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": true, + "min": true, + "show": true, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + 
"targets": [ + { + "expr": "irate(elasticsearch_thread_pool_completed_count{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{name}} - {{ type }}", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Thread Pool operations completed", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 83 + }, + "id": 58, + "panels": [], + "repeat": null, + "title": "JVM Garbage Collection", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 12, + "x": 0, + "y": 84 + }, + "height": "400", + "id": 7, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_jvm_gc_collection_seconds_count{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + 
"legendFormat": "{{name}} - {{gc}}", + "metric": "", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "GC count", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "GCs", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 12, + "x": 12, + "y": 84 + }, + "height": "400", + "id": 27, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_jvm_gc_collection_seconds_count{cluster=\"$cluster\",name=~\"$node\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}} - {{gc}}", + "metric": "", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "GC time", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + 
"values": [] + }, + "yaxes": [ + { + "format": "s", + "label": "Time", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "elasticsearch", + "App" + ], + "templating": { + "list": [ + { + "auto": true, + "auto_count": 30, + "auto_min": "10s", + "current": { + "text": "auto", + "value": "$__auto_interval_interval" + }, + "hide": 0, + "label": "Interval", + "name": "interval", + "options": [ + { + "selected": true, + "text": "auto", + "value": "$__auto_interval_interval" + }, + { + "selected": false, + "text": "1m", + "value": "1m" + }, + { + "selected": false, + "text": "10m", + "value": "10m" + }, + { + "selected": false, + "text": "30m", + "value": "30m" + }, + { + "selected": false, + "text": "1h", + "value": "1h" + }, + { + "selected": false, + "text": "6h", + "value": "6h" + }, + { + "selected": false, + "text": "12h", + "value": "12h" + }, + { + "selected": false, + "text": "1d", + "value": "1d" + }, + { + "selected": false, + "text": "7d", + "value": "7d" + }, + { + "selected": false, + "text": "14d", + "value": "14d" + }, + { + "selected": false, + "text": "30d", + "value": "30d" + } + ], + "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d", + "refresh": 2, + "skipUrlSync": false, + "type": "interval" + }, + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "Instance", + "multi": false, + "name": "cluster", + "options": [], + "query": 
"label_values(elasticsearch_cluster_health_status,cluster)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 1, + "tagValuesQuery": null, + "tags": [], + "tagsQuery": null, + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": { + "text": "All", + "value": "$__all" + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": true, + "label": "node", + "multi": true, + "name": "node", + "options": [], + "query": "label_values(elasticsearch_process_cpu_percent,name)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 1, + "tagValuesQuery": null, + "tags": [], + "tagsQuery": null, + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "Elasticsearch", + "version": 1 + } \ No newline at end of file diff --git a/grafana/values_overrides/home_dashboard.yaml b/grafana/values_overrides/home_dashboard.yaml index b66c463cf..dd8f2dde9 100644 --- a/grafana/values_overrides/home_dashboard.yaml +++ b/grafana/values_overrides/home_dashboard.yaml @@ -1,94 +1,109 @@ -# This overrides file provides a reference for dashboards for +# This override file provides a reference for dashboards for # customized OSH Welcome Page conf: dashboards: - home_dashboard: - annotations: - list: - - builtIn: 1 - datasource: "-- Grafana --" - enable: true - hide: true - iconColor: rgba(0, 211, 255, 1) - name: Annotations & Alerts - type: dashboard - editable: false - gnetId: - graphTooltip: 0 - id: 51 - links: [] - panels: - - content: |- -
- OSH Home Dashboard -
- editable: true - gridPos: - h: 3 - w: 24 - x: 0 - 'y': 0 - id: 1 - links: [] - mode: html - options: {} - style: {} - title: '' - transparent: true - type: text - - folderId: 0 - gridPos: - h: 10 - w: 13 - x: 6 - 'y': 3 - headings: true - id: 3 - limit: 30 - links: [] - options: {} - query: '' - recent: true - search: false - starred: true - tags: [] - title: '' - type: dashlist - schemaVersion: 18 - style: dark - tags: [] - templating: - list: [] - time: - from: now-1h - to: now - timepicker: - hidden: true - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - type: timepicker - timezone: browser - title: OSH Home - version: 3 + home_dashboard: |- + { + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": true, + "gnetId": null, + "graphTooltip": 0, + "id": 66, + "links": [], + "panels": [ + { + "content": "
\n OSH Home Dashboard\n
", + "editable": true, + "gridPos": { + "h": 3, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 1, + "links": [], + "mode": "html", + "options": {}, + "style": {}, + "title": "", + "transparent": true, + "type": "text" + }, + { + "folderId": 0, + "gridPos": { + "h": 10, + "w": 13, + "x": 6, + "y": 3 + }, + "headings": true, + "id": 3, + "limit": 30, + "links": [], + "options": {}, + "query": "", + "recent": true, + "search": false, + "starred": true, + "tags": [], + "title": "", + "type": "dashlist" + } + ], + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "hidden": true, + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ], + "type": "timepicker" + }, + "timezone": "browser", + "title": "OSH Home", + "version": 1 + } manifests: job_add_home_dashboard: true \ No newline at end of file diff --git a/grafana/values_overrides/kubernetes.yaml b/grafana/values_overrides/kubernetes.yaml index b9b35e34a..b1e892ef7 100644 --- a/grafana/values_overrides/kubernetes.yaml +++ b/grafana/values_overrides/kubernetes.yaml @@ -2,1560 +2,2112 @@ # reflect the overall state of a Kubernetes deployment conf: dashboards: - kubernetes_capacity_planning: - __inputs: - - name: DS_PROMETHEUS - label: prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.4.1 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - annotations: - list: [] - description: '' - editable: true - gnetId: 22 - graphTooltip: 0 - hideControls: false - id: - links: [] - refresh: false - rows: - - 
collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 3 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(rate(node_cpu{mode="idle"}[2m])) * 100 - hide: false - intervalFactor: 10 - legendFormat: '' - refId: A - step: 50 - thresholds: [] - timeFrom: - timeShift: - title: Idle cpu - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: percent - label: cpu usage - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 9 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(node_load1) - intervalFactor: 4 - legendFormat: load 1m - refId: A - step: 20 - target: '' - - expr: sum(node_load5) - intervalFactor: 4 - legendFormat: load 5m - refId: B - step: 20 - target: '' - - expr: sum(node_load15) - intervalFactor: 4 - legendFormat: load 15m - refId: C - step: 20 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: System load - tooltip: - 
msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: percentunit - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 4 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: node_memory_SwapFree{instance="172.17.0.1:9100",job="prometheus"} - yaxis: 2 - spaceLength: 10 - span: 9 - stack: true - steppedLine: false - targets: - - expr: sum(node_memory_MemTotal) - sum(node_memory_MemFree) - sum(node_memory_Buffers) - - sum(node_memory_Cached) - intervalFactor: 2 - legendFormat: memory usage - metric: memo - refId: A - step: 10 - target: '' - - expr: sum(node_memory_Buffers) - interval: '' - intervalFactor: 2 - legendFormat: memory buffers - metric: memo - refId: B - step: 10 - target: '' - - expr: sum(node_memory_Cached) - interval: '' - intervalFactor: 2 - legendFormat: memory cached - metric: memo - refId: C - step: 10 - target: '' - - expr: sum(node_memory_MemFree) - interval: '' - intervalFactor: 2 - legendFormat: memory free - metric: memo - refId: D - step: 10 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: Memory usage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - 
min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 5 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: "((sum(node_memory_MemTotal) - sum(node_memory_MemFree) - sum(node_memory_Buffers) - - sum(node_memory_Cached)) / sum(node_memory_MemTotal)) * 100" - intervalFactor: 2 - metric: '' - refId: A - step: 60 - target: '' - thresholds: 80, 90 - title: Memory usage - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 246 - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 6 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: read - yaxis: 1 - - alias: '{instance="172.17.0.1:9100"}' - yaxis: 2 - - alias: io time - yaxis: 2 - spaceLength: 10 - span: 
9 - stack: false - steppedLine: false - targets: - - expr: sum(rate(node_disk_bytes_read[5m])) - hide: false - intervalFactor: 4 - legendFormat: read - refId: A - step: 20 - target: '' - - expr: sum(rate(node_disk_bytes_written[5m])) - intervalFactor: 4 - legendFormat: written - refId: B - step: 20 - - expr: sum(rate(node_disk_io_time_ms[5m])) - intervalFactor: 4 - legendFormat: io time - refId: C - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Disk I/O - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: ms - label: - logBase: 1 - max: - min: - show: true - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percentunit - gauge: - maxValue: 1 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 12 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: (sum(node_filesystem_size{device!="rootfs"}) - sum(node_filesystem_free{device!="rootfs"})) - / sum(node_filesystem_size{device!="rootfs"}) - intervalFactor: 2 - refId: A - step: 60 - target: '' - thresholds: 0.75, 0.9 - title: Disk space usage - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - repeat: - repeatIteration: - 
repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 8 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: 'transmitted ' - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(rate(node_network_receive_bytes{device!~"lo"}[5m])) - hide: false - intervalFactor: 2 - legendFormat: '' - refId: A - step: 10 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: Network received - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 10 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: 'transmitted ' - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(rate(node_network_transmit_bytes{device!~"lo"}[5m])) - hide: false - intervalFactor: 2 - legendFormat: '' - refId: B - step: 10 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: Network transmitted - tooltip: - 
msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: bytes - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 276 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 11 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 9 - stack: false - steppedLine: false - targets: - - expr: sum(kube_pod_info) - format: time_series - intervalFactor: 2 - legendFormat: Current number of Pods - refId: A - step: 10 - - expr: sum(kube_node_status_capacity_pods) - format: time_series - intervalFactor: 2 - legendFormat: Maximum capacity of pods - refId: B - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Cluster Pod Utilization - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 7 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to 
text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: 100 - (sum(kube_node_status_capacity_pods) - sum(kube_pod_info)) / sum(kube_node_status_capacity_pods) - * 100 - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 60 - target: '' - thresholds: '80,90' - title: Pod Utilization - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Dashboard Row - titleSize: h6 - schemaVersion: 14 - style: dark - tags: [] - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - time: - from: now-1h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: browser - title: Kubernetes Capacity Planning - version: 4 - inputs: - - name: prometheus - pluginId: prometheus - type: datasource - value: prometheus - overwrite: true - kubernetes_cluster_status: - __inputs: - - name: prometheus - label: prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.4.1 - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - annotations: - list: [] - editable: true - gnetId: - graphTooltip: 0 - hideControls: false - id: - links: [] - 
rows: - - collapse: false - height: 129 - panels: - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 5 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 6 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: sum(up{job=~"apiserver|kube-scheduler|kube-controller-manager"} == 0) - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '1,3' - title: Control Plane UP - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: UP - value: 'null' - valueName: total - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 6 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 6 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: sum(ALERTS{alertstate="firing",alertname!="DeadMansSwitch"}) - 
format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '3,5' - title: Alerts Firing - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: '0' - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Cluster Health - titleSize: h6 - - collapse: false - height: 168 - panels: - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - decimals: - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 1 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: (sum(up{job="apiserver"} == 1) / count(up{job="apiserver"})) * 100 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '50,80' - title: API Servers UP - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - decimals: - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 2 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - 
nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: (sum(up{job="kube-controller-manager-discovery"} == 1) / count(up{job="kube-controller-manager-discovery"})) - * 100 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '50,80' - title: Controller Managers UP - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - decimals: - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 3 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: (sum(up{job="kube-scheduler-discovery"} == 1) / count(up{job="kube-scheduler-discovery"})) - * 100 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '50,80' - title: Schedulers UP - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - 
rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - hideTimeOverride: false - id: 4 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: count(increase(kube_pod_container_status_restarts{namespace=~"kube-system|tectonic-system"}[1h]) - > 5) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '1,3' - title: Crashlooping Control Plane Pods - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: '0' - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Control Plane Status - titleSize: h6 - - collapse: false - height: 158 - panels: - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 8 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - 
targets: - - expr: sum(100 - (avg by (instance) (rate(node_cpu{job="node-exporter",mode="idle"}[5m])) - * 100)) / count(node_cpu{job="node-exporter",mode="idle"}) - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '80,90' - title: CPU Utilization - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 7 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: "((sum(node_memory_MemTotal) - sum(node_memory_MemFree) - sum(node_memory_Buffers) - - sum(node_memory_Cached)) / sum(node_memory_MemTotal)) * 100" - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '80,90' - title: Memory Utilization - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 9 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - 
- name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: (sum(node_filesystem_size{device!="rootfs"}) - sum(node_filesystem_free{device!="rootfs"})) - / sum(node_filesystem_size{device!="rootfs"}) - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '80,90' - title: Filesystem Utilization - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 10 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: 100 - (sum(kube_node_status_capacity_pods) - sum(kube_pod_info)) / sum(kube_node_status_capacity_pods) - * 100 - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '80,90' - title: Pod Utilization - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Capacity Planing 
- titleSize: h6 - schemaVersion: 14 - style: dark - tags: [] - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - time: - from: now-6h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: '' - title: Kubernetes Cluster Status - version: 3 - inputs: - - name: prometheus - pluginId: prometheus - type: datasource - value: prometheus - overwrite: true + kubernetes_capacity_planning: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "4.4.1" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "", + "overwrite": true, + "editable": false, + "gnetId": 22, + "graphTooltip": 0, + "id": 35, + "links": [], + "panels": [ + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 0 + }, + "id": 3, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, 
+ "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(node_cpu{mode=\"idle\"}[2m])) * 100", + "hide": false, + "intervalFactor": 10, + "legendFormat": "", + "refId": "A", + "step": 50 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Idle cpu", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "percent", + "label": "cpu usage", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 0 + }, + "id": 9, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(node_load1)", + "intervalFactor": 4, + "legendFormat": "load 1m", + "refId": "A", + "step": 20, + "target": "" + }, + { + "expr": 
"sum(node_load5)", + "intervalFactor": 4, + "legendFormat": "load 5m", + "refId": "B", + "step": 20, + "target": "" + }, + { + "expr": "sum(node_load15)", + "intervalFactor": 4, + "legendFormat": "load 15m", + "refId": "C", + "step": 20, + "target": "" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "System load", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "percentunit", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 18, + "x": 0, + "y": 7 + }, + "id": 4, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "node_memory_SwapFree{instance=\"172.17.0.1:9100\",job=\"prometheus\"}", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum(node_memory_MemTotal) - sum(node_memory_MemFree) - sum(node_memory_Buffers) - sum(node_memory_Cached)", + "intervalFactor": 2, + "legendFormat": "memory usage", + "metric": "memo", + "refId": "A", + "step": 10, + "target": "" + }, + { + "expr": "sum(node_memory_Buffers)", + 
"interval": "", + "intervalFactor": 2, + "legendFormat": "memory buffers", + "metric": "memo", + "refId": "B", + "step": 10, + "target": "" + }, + { + "expr": "sum(node_memory_Cached)", + "interval": "", + "intervalFactor": 2, + "legendFormat": "memory cached", + "metric": "memo", + "refId": "C", + "step": 10, + "target": "" + }, + { + "expr": "sum(node_memory_MemFree)", + "interval": "", + "intervalFactor": 2, + "legendFormat": "memory free", + "metric": "memo", + "refId": "D", + "step": 10, + "target": "" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Memory usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 7 + }, + "id": 5, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": 
[ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "((sum(node_memory_MemTotal) - sum(node_memory_MemFree) - sum(node_memory_Buffers) - sum(node_memory_Cached)) / sum(node_memory_MemTotal)) * 100", + "intervalFactor": 2, + "metric": "", + "refId": "A", + "step": 60, + "target": "" + } + ], + "thresholds": "80, 90", + "title": "Memory usage", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 18, + "x": 0, + "y": 14 + }, + "id": 6, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "read", + "yaxis": 1 + }, + { + "alias": "{instance=\"172.17.0.1:9100\"}", + "yaxis": 2 + }, + { + "alias": "io time", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(node_disk_bytes_read[5m]))", + "hide": false, + "intervalFactor": 4, + "legendFormat": "read", + "refId": "A", + "step": 20, + "target": "" + }, + { + "expr": "sum(rate(node_disk_bytes_written[5m]))", + "intervalFactor": 4, + "legendFormat": "written", + "refId": "B", + "step": 20 + }, + { + "expr": "sum(rate(node_disk_io_time_ms[5m]))", + "intervalFactor": 4, + "legendFormat": "io time", + "refId": "C", + "step": 20 + } + 
], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Disk I/O", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "ms", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "percentunit", + "gauge": { + "maxValue": 1, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 14 + }, + "id": 12, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "(sum(node_filesystem_size{device!=\"rootfs\"}) - sum(node_filesystem_free{device!=\"rootfs\"})) / sum(node_filesystem_size{device!=\"rootfs\"})", + "intervalFactor": 2, + "refId": "A", + "step": 60, + "target": "" + } + ], + "thresholds": "0.75, 0.9", + "title": "Disk 
space usage", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 21 + }, + "id": 8, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "transmitted ", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(node_network_receive_bytes{device!~\"lo\"}[5m]))", + "hide": false, + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 10, + "target": "" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Network received", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 
21 + }, + "id": 10, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "transmitted ", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(node_network_transmit_bytes{device!~\"lo\"}[5m]))", + "hide": false, + "intervalFactor": 2, + "legendFormat": "", + "refId": "B", + "step": 10, + "target": "" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Network transmitted", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 18, + "x": 0, + "y": 28 + }, + "id": 11, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(kube_pod_info)", + "format": 
"time_series", + "intervalFactor": 2, + "legendFormat": "Current number of Pods", + "refId": "A", + "step": 10 + }, + { + "expr": "sum(kube_node_status_capacity_pods)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Maximum capacity of pods", + "refId": "B", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cluster Pod Utilization", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 28 + }, + "id": 7, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + 
"targets": [ + { + "expr": "100 - (sum(kube_node_status_capacity_pods) - sum(kube_pod_info)) / sum(kube_node_status_capacity_pods) * 100", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 60, + "target": "" + } + ], + "thresholds": "80,90", + "title": "Pod Utilization", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + } + ], + "refresh": false, + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "Kubernetes Capacity Planning", + "version": 1 + } + kubernetes_cluster_status: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "4.4.1" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": 
true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 5, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 11, + "panels": [], + "repeat": null, + "title": "Cluster Health", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 12, + "x": 0, + "y": 1 + }, + "id": 5, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(up{job=~\"apiserver|kube-scheduler|kube-controller-manager\"} == 0)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "1,3", + "title": "Control Plane UP", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "UP", + "value": "null" + } + ], + "valueName": "total" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + 
"rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 12, + "x": 12, + "y": 1 + }, + "id": 6, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(ALERTS{alertstate=\"firing\",alertname!=\"DeadMansSwitch\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "3,5", + "title": "Alerts Firing", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 5 + }, + "id": 12, + "panels": [], + "repeat": null, + "title": "Control Plane Status", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": null, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 6, + "x": 0, + "y": 6 + }, + "id": 1, + "interval": null, + "links": 
[], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "(sum(up{job=\"apiserver\"} == 1) / count(up{job=\"apiserver\"})) * 100", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "50,80", + "title": "API Servers UP", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": null, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 6, + "x": 6, + "y": 6 + }, + "id": 2, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": 
"rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "(sum(up{job=\"kube-controller-manager-discovery\"} == 1) / count(up{job=\"kube-controller-manager-discovery\"})) * 100", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "50,80", + "title": "Controller Managers UP", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": null, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 6, + "x": 12, + "y": 6 + }, + "id": 3, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "(sum(up{job=\"kube-scheduler-discovery\"} == 1) / count(up{job=\"kube-scheduler-discovery\"})) * 100", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "50,80", + "title": "Schedulers UP", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + 
{ + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": null, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 6, + "x": 18, + "y": 6 + }, + "hideTimeOverride": false, + "id": 4, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "count(increase(kube_pod_container_status_restarts{namespace=~\"kube-system|tectonic-system\"}[1h]) > 5)", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "1,3", + "title": "Crashlooping Control Plane Pods", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 11 + }, + "id": 13, + "panels": [], + "repeat": null, + "title": "Capacity Planing", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + 
"rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 0, + "y": 12 + }, + "id": 8, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(100 - (avg by (instance) (rate(node_cpu{job=\"node-exporter\",mode=\"idle\"}[5m])) * 100)) / count(node_cpu{job=\"node-exporter\",mode=\"idle\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "80,90", + "title": "CPU Utilization", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 6, + "y": 12 + }, + "id": 7, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + 
"maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "((sum(node_memory_MemTotal) - sum(node_memory_MemFree) - sum(node_memory_Buffers) - sum(node_memory_Cached)) / sum(node_memory_MemTotal)) * 100", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "80,90", + "title": "Memory Utilization", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 12, + "y": 12 + }, + "id": 9, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": 
"(sum(node_filesystem_size{device!=\"rootfs\"}) - sum(node_filesystem_free{device!=\"rootfs\"})) / sum(node_filesystem_size{device!=\"rootfs\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "80,90", + "title": "Filesystem Utilization", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 18, + "y": 12 + }, + "id": 10, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "100 - (sum(kube_node_status_capacity_pods) - sum(kube_pod_info)) / sum(kube_node_status_capacity_pods) * 100", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "80,90", + "title": "Pod Utilization", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + } + ], + "schemaVersion": 18, + 
"style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "Kubernetes Cluster Status", + "version": 1 + } \ No newline at end of file diff --git a/grafana/values_overrides/nginx.yaml b/grafana/values_overrides/nginx.yaml index 7c36c9584..daa3086a9 100644 --- a/grafana/values_overrides/nginx.yaml +++ b/grafana/values_overrides/nginx.yaml @@ -2,618 +2,1463 @@ # nginx conf: dashboards: - nginx_stats: - __inputs: - - name: prometheus - label: prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.5.2 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - annotations: - list: [] - description: Show stats from the hnlq715/nginx-vts-exporter. 
- editable: true - gnetId: 2949 - graphTooltip: 0 - hideControls: false - id: - links: [] - refresh: 5m - rows: - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 7 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 12 - stack: false - steppedLine: false - targets: - - expr: sum(nginx_upstream_responses_total{upstream=~"^$Upstream$"}) by (status_code, - upstream) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ status_code }}.{{ upstream }}" - metric: nginx_upstream_response - refId: A - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: HTTP Response Codes by Upstream - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Dashboard Row - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 6 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(irate(nginx_upstream_requests_total{upstream=~"^$Upstream$"}[5m])) - by (upstream) - format: time_series - 
interval: '' - intervalFactor: 2 - legendFormat: "{{ upstream }}" - metric: nginx_upstream_requests - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Upstream Requests rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 5 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(irate(nginx_upstream_bytes_total{upstream=~"^$Upstream$"}[5m])) by - (direction, upstream) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ direction }}.{{ upstream }}" - metric: nginx_upstream_bytes - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Upstream Bytes Transfer rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Dashboard Row - titleSize: h6 - - collapse: false - height: 250px - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 1 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: 
true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(irate(nginx_connections_total[5m])) by (type) - format: time_series - intervalFactor: 2 - legendFormat: "{{ type }}" - metric: nginx_server_connections - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Overall Connections rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 4 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(irate(nginx_cache_total{ server_zone=~"$ingress"}[5m])) by (server_zone, - type) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ type }}.{{ server_zone }}" - metric: nginx_server_cache - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Cache Action rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Dashboard Row - titleSize: h6 - - collapse: 
false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 3 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(irate(nginx_requests_total{ server_zone=~"$ingress" }[5m])) by (server_zone) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ server_zone }}" - metric: nginx_server_requests - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Overall Requests rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 2 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(irate(nginx_bytes_total{ server_zone=~"$ingress" }[5m])) by (direction, - server_zone) - format: time_series - intervalFactor: 2 - legendFormat: "{{ direction }}.{{ server_zone }}" - metric: nginx_server_bytes - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Overall Bytes Transferred rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - 
xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Dashboard Row - titleSize: h6 - schemaVersion: 14 - style: dark - tags: - - prometheus - - nginx - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: ".*" - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: - multi: true - name: Upstream - options: [] - query: label_values(nginx_upstream_bytes_total, upstream) - refresh: 1 - regex: '' - sort: 1 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: - multi: true - name: ingress - options: [] - query: label_values(nginx_bytes_total, server_zone) - refresh: 1 - regex: "/^[^\\*_]+$/" - sort: 1 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - time: - from: now-1h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: browser - title: Nginx Stats - version: 13 + nginx_stats: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "Prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + 
"version": "" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + }, + { + "datasource": "${DS_PROMETHEUS}", + "enable": true, + "expr": "sum(changes(nginx_ingress_controller_config_last_reload_successful_timestamp_seconds{instance!=\"unknown\",controller_class=~\"$controller_class\",namespace=~\"$namespace\"}[30s])) by (controller_class)", + "hide": false, + "iconColor": "rgba(255, 96, 96, 1)", + "limit": 100, + "name": "Config Reloads", + "showIn": 0, + "step": "30s", + "tagKeys": "controller_class", + "tags": [], + "titleFormat": "Config Reloaded", + "type": "tags" + } + ] + }, + "editable": true, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "links": [], + "panels": [ + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "ops", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 6, + "x": 0, + "y": 0 + }, + "id": 20, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": 
"round(sum(irate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",namespace=~\"$namespace\"}[2m])), 0.001)", + "format": "time_series", + "intervalFactor": 1, + "refId": "A", + "step": 4 + } + ], + "thresholds": "", + "title": "Controller Request Volume", + "transparent": false, + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 6, + "x": 6, + "y": 0 + }, + "id": 82, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(avg_over_time(nginx_ingress_controller_nginx_process_connections{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\"}[2m]))", + "format": "time_series", + "instant": false, + "intervalFactor": 1, + "refId": "A", + "step": 4 + } + ], + "thresholds": "", + "title": "Controller Connections", + "transparent": false, + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + 
"text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "percentunit", + "gauge": { + "maxValue": 100, + "minValue": 80, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": false + }, + "gridPos": { + "h": 3, + "w": 6, + "x": 12, + "y": 0 + }, + "id": 21, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(rate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",namespace=~\"$namespace\",status!~\"[4-5].*\"}[2m])) / sum(rate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",namespace=~\"$namespace\"}[2m]))", + "format": "time_series", + "intervalFactor": 1, + "refId": "A", + "step": 4 + } + ], + "thresholds": "95, 99, 99.5", + "title": "Controller Success Rate (non-4|5xx responses)", + "transparent": false, + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": 
"${DS_PROMETHEUS}", + "decimals": 0, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 3, + "x": 18, + "y": 0 + }, + "id": 81, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "avg(nginx_ingress_controller_success{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\"})", + "format": "time_series", + "instant": true, + "intervalFactor": 1, + "refId": "A", + "step": 4 + } + ], + "thresholds": "", + "title": "Config Reloads", + "transparent": false, + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 3, + "x": 21, + "y": 0 + }, + "id": 83, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + 
"nullPointMode": "connected", + "nullText": null, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "count(nginx_ingress_controller_config_last_reload_successful{controller_pod=~\"$controller\",controller_namespace=~\"$namespace\"} == 0)", + "format": "time_series", + "instant": true, + "intervalFactor": 1, + "refId": "A", + "step": 4 + } + ], + "thresholds": "", + "title": "Last Config Failed", + "transparent": false, + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "None", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 3 + }, + "height": "200px", + "id": 86, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "hideEmpty": false, + "hideZero": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 300, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "repeat": null, + "repeatDirection": "h", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "round(sum(irate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\"}[2m])) by 
(ingress), 0.001)", + "format": "time_series", + "hide": false, + "instant": false, + "interval": "", + "intervalFactor": 1, + "legendFormat": "{{ ingress }}", + "metric": "network", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Ingress Request Volume", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "transparent": false, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "reqps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "max - istio-proxy": "#890f02", + "max - master": "#bf1b00", + "max - prometheus": "#bf1b00" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": false, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 3 + }, + "id": 87, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "hideEmpty": true, + "hideZero": false, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 300, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr":
"sum(rate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",namespace=~\"$namespace\",ingress=~\"$ingress\",status!~\"[4-5].*\"}[2m])) by (ingress) / sum(rate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",namespace=~\"$namespace\",ingress=~\"$ingress\"}[2m])) by (ingress)", + "format": "time_series", + "instant": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "{{ ingress }}", + "metric": "container_memory_usage:sort_desc", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Ingress Success Rate (non-4|5xx responses)", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 1, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "percentunit", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 6, + "w": 8, + "x": 0, + "y": 10 + }, + "height": "200px", + "id": 32, + "isNew": true, + "legend": { + "alignAsTable": false, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": false, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + 
"spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum (irate (nginx_ingress_controller_request_size_sum{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\"}[2m]))", + "format": "time_series", + "instant": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "Received", + "metric": "network", + "refId": "A", + "step": 10 + }, + { + "expr": "- sum (irate (nginx_ingress_controller_response_size_sum{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\"}[2m]))", + "format": "time_series", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "Sent", + "metric": "network", + "refId": "B", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Network I/O pressure", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "transparent": false, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "max - istio-proxy": "#890f02", + "max - master": "#bf1b00", + "max - prometheus": "#bf1b00" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": false, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 6, + "w": 8, + "x": 8, + "y": 10 + }, + "id": 77, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": false, + "sideWidth": 200, + 
"sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "avg(nginx_ingress_controller_nginx_process_resident_memory_bytes{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\"}) ", + "format": "time_series", + "instant": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "nginx", + "metric": "container_memory_usage:sort_desc", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Average Memory Usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "max - istio-proxy": "#890f02", + "max - master": "#bf1b00" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 3, + "editable": false, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 6, + "w": 8, + "x": 16, + "y": 10 + }, + "height": "", + "id": 79, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": false, + "sort": null, + "sortDesc": null, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": 
[], + "nullPointMode": "connected", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum (rate (nginx_ingress_controller_nginx_process_cpu_seconds_total{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\"}[2m])) ", + "format": "time_series", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "nginx", + "metric": "container_cpu", + "refId": "A", + "step": 10 + } + ], + "thresholds": [ + { + "colorMode": "critical", + "fill": true, + "line": true, + "op": "gt" + } + ], + "timeFrom": null, + "timeShift": null, + "title": "Average CPU Usage", + "tooltip": { + "msResolution": true, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "transparent": false, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "cores", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "columns": [], + "datasource": "${DS_PROMETHEUS}", + "fontSize": "100%", + "gridPos": { + "h": 8, + "w": 24, + "x": 0, + "y": 16 + }, + "hideTimeOverride": false, + "id": 75, + "links": [], + "pageSize": 7, + "repeat": null, + "repeatDirection": "h", + "scroll": true, + "showHeader": true, + "sort": { + "col": 1, + "desc": true + }, + "styles": [ + { + "alias": "Ingress", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "ingress", + "preserveFormat": false, + "sanitize": false, + "thresholds": [], + "type": "string", + "unit": 
"short" + }, + { + "alias": "Requests", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "Value #A", + "thresholds": [ + "" + ], + "type": "number", + "unit": "ops" + }, + { + "alias": "Errors", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "Value #B", + "thresholds": [], + "type": "number", + "unit": "ops" + }, + { + "alias": "P50 Latency", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 0, + "link": false, + "pattern": "Value #C", + "thresholds": [], + "type": "number", + "unit": "dtdurations" + }, + { + "alias": "P90 Latency", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 0, + "pattern": "Value #D", + "thresholds": [], + "type": "number", + "unit": "dtdurations" + }, + { + "alias": "P99 Latency", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 0, + "pattern": "Value #E", + "thresholds": [], + "type": "number", + "unit": "dtdurations" + }, + { + "alias": "IN", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "Value #F", + "thresholds": [ + "" + ], + "type": "number", + "unit": "Bps" + }, + { + "alias": "", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + 
"dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "Time", + "thresholds": [], + "type": "hidden", + "unit": "short" + }, + { + "alias": "OUT", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "mappingType": 1, + "pattern": "Value #G", + "thresholds": [], + "type": "number", + "unit": "Bps" + } + ], + "targets": [ + { + "expr": "histogram_quantile(0.50, sum(rate(nginx_ingress_controller_request_duration_seconds_bucket{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\"}[2m])) by (le, ingress))", + "format": "table", + "hide": false, + "instant": true, + "intervalFactor": 1, + "legendFormat": "{{ ingress }}", + "refId": "C" + }, + { + "expr": "histogram_quantile(0.90, sum(rate(nginx_ingress_controller_request_duration_seconds_bucket{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\"}[2m])) by (le, ingress))", + "format": "table", + "hide": false, + "instant": true, + "intervalFactor": 1, + "legendFormat": "{{ ingress }}", + "refId": "D" + }, + { + "expr": "histogram_quantile(0.99, sum(rate(nginx_ingress_controller_request_duration_seconds_bucket{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\"}[2m])) by (le, ingress))", + "format": "table", + "hide": false, + "instant": true, + "intervalFactor": 1, + "legendFormat": "{{ destination_service }}", + "refId": "E" + }, + { + "expr": "sum(irate(nginx_ingress_controller_request_size_sum{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\"}[2m])) by (ingress)", + "format": "table", + "hide": false, + 
"instant": true, + "interval": "", + "intervalFactor": 1, + "legendFormat": "{{ ingress }}", + "refId": "F" + }, + { + "expr": "sum(irate(nginx_ingress_controller_response_size_sum{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\"}[2m])) by (ingress)", + "format": "table", + "instant": true, + "intervalFactor": 1, + "legendFormat": "{{ ingress }}", + "refId": "G" + } + ], + "timeFrom": null, + "title": "Ingress Percentile Response Times and Transfer Rates", + "transform": "table", + "transparent": false, + "type": "table" + }, + { + "columns": [ + { + "text": "Current", + "value": "current" + } + ], + "datasource": "${DS_PROMETHEUS}", + "fontSize": "100%", + "gridPos": { + "h": 8, + "w": 24, + "x": 0, + "y": 24 + }, + "height": "1024", + "id": 85, + "links": [], + "pageSize": 7, + "scroll": true, + "showHeader": true, + "sort": { + "col": 1, + "desc": false + }, + "styles": [ + { + "alias": "Time", + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "pattern": "Time", + "type": "date" + }, + { + "alias": "TTL", + "colorMode": "cell", + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 0, + "pattern": "Current", + "thresholds": [ + "0", + "691200" + ], + "type": "number", + "unit": "s" + }, + { + "alias": "", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "decimals": 2, + "pattern": "/.*/", + "thresholds": [], + "type": "number", + "unit": "short" + } + ], + "targets": [ + { + "expr": "avg(nginx_ingress_controller_ssl_expire_time_seconds{kubernetes_pod_name=~\"$controller\",namespace=~\"$namespace\",ingress=~\"$ingress\"}) by (host) - time()", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{ host }}", + "metric": "gke_letsencrypt_cert_expiration", + "refId": "A", + "step": 1 + 
} + ], + "title": "Ingress Certificate Expiry", + "transform": "timeseries_aggregations", + "type": "table" + } + ], + "refresh": "5s", + "schemaVersion": 16, + "style": "dark", + "tags": [ + "nginx" + ], + "templating": { + "list": [ + { + "allValue": ".*", + "current": { + "text": "All", + "value": "$__all" + }, + "datasource": "${DS_PROMETHEUS}", + "hide": 0, + "includeAll": true, + "label": "Namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(nginx_ingress_controller_config_hash, controller_namespace)", + "refresh": 1, + "regex": "", + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": ".*", + "current": { + "text": "All", + "value": "$__all" + }, + "datasource": "${DS_PROMETHEUS}", + "hide": 0, + "includeAll": true, + "label": "Controller Class", + "multi": false, + "name": "controller_class", + "options": [], + "query": "label_values(nginx_ingress_controller_config_hash{namespace=~\"$namespace\"}, controller_class) ", + "refresh": 1, + "regex": "", + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": ".*", + "current": { + "text": "All", + "value": "$__all" + }, + "datasource": "${DS_PROMETHEUS}", + "hide": 0, + "includeAll": true, + "label": "Controller", + "multi": false, + "name": "controller", + "options": [], + "query": "label_values(nginx_ingress_controller_config_hash{namespace=~\"$namespace\",controller_class=~\"$controller_class\"}, controller_pod) ", + "refresh": 1, + "regex": "", + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": ".*", + "current": { + "tags": [], + "text": "All", + "value": "$__all" + }, + "datasource": "${DS_PROMETHEUS}", + "hide": 0, + "includeAll": true, + "label": "Ingress", + "multi": false, + "name": "ingress", + "options": [], + "query": 
"label_values(nginx_ingress_controller_requests{namespace=~\"$namespace\",controller_class=~\"$controller_class\",controller=~\"$controller\"}, ingress) ", + "refresh": 1, + "regex": "", + "sort": 2, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "2m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "NGINX Ingress controller", + "uid": "nginx", + "version": 1 + } \ No newline at end of file diff --git a/grafana/values_overrides/nodes.yaml b/grafana/values_overrides/nodes.yaml index 0c28bd890..a2d30678d 100644 --- a/grafana/values_overrides/nodes.yaml +++ b/grafana/values_overrides/nodes.yaml @@ -2,754 +2,977 @@ # the status of all nodes in a deployment conf: dashboards: - nodes: - __inputs: - - name: prometheus - label: prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.4.1 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - annotations: - list: [] - description: Dashboard to get an overview of one server - editable: true - gnetId: 22 - graphTooltip: 0 - hideControls: false - id: - links: [] - refresh: false - rows: - - collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 3 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] 
- nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: 100 - (avg by (cpu) (irate(node_cpu{mode="idle", instance="$server"}[5m])) - * 100) - hide: false - intervalFactor: 10 - legendFormat: "{{cpu}}" - refId: A - step: 50 - thresholds: [] - timeFrom: - timeShift: - title: Idle cpu - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: percent - label: cpu usage - logBase: 1 - max: 100 - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 9 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: node_load1{instance="$server"} - intervalFactor: 4 - legendFormat: load 1m - refId: A - step: 20 - target: '' - - expr: node_load5{instance="$server"} - intervalFactor: 4 - legendFormat: load 5m - refId: B - step: 20 - target: '' - - expr: node_load15{instance="$server"} - intervalFactor: 4 - legendFormat: load 15m - refId: C - step: 20 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: System load - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: percentunit - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - 
min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 4 - legend: - alignAsTable: false - avg: false - current: false - hideEmpty: false - hideZero: false - max: false - min: false - rightSide: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: node_memory_SwapFree{instance="172.17.0.1:9100",job="prometheus"} - yaxis: 2 - spaceLength: 10 - span: 9 - stack: true - steppedLine: false - targets: - - expr: node_memory_MemTotal{instance="$server"} - node_memory_MemFree{instance="$server"} - - node_memory_Buffers{instance="$server"} - node_memory_Cached{instance="$server"} - hide: false - interval: '' - intervalFactor: 2 - legendFormat: memory used - metric: '' - refId: C - step: 10 - - expr: node_memory_Buffers{instance="$server"} - interval: '' - intervalFactor: 2 - legendFormat: memory buffers - metric: '' - refId: E - step: 10 - - expr: node_memory_Cached{instance="$server"} - intervalFactor: 2 - legendFormat: memory cached - metric: '' - refId: F - step: 10 - - expr: node_memory_MemFree{instance="$server"} - intervalFactor: 2 - legendFormat: memory free - metric: '' - refId: D - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Memory usage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - cacheTimeout: - colorBackground: false - colorValue: false - colors: 
- - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 5 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: ((node_memory_MemTotal{instance="$server"} - node_memory_MemFree{instance="$server"} - - node_memory_Buffers{instance="$server"} - node_memory_Cached{instance="$server"}) - / node_memory_MemTotal{instance="$server"}) * 100 - intervalFactor: 2 - refId: A - step: 60 - target: '' - thresholds: 80, 90 - title: Memory usage - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 6 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: read - yaxis: 1 - - alias: '{instance="172.17.0.1:9100"}' - yaxis: 2 - - alias: io time - yaxis: 2 - spaceLength: 10 - span: 9 - stack: false - steppedLine: false - targets: - - expr: sum by (instance) 
(rate(node_disk_bytes_read{instance="$server"}[2m])) - hide: false - intervalFactor: 4 - legendFormat: read - refId: A - step: 20 - target: '' - - expr: sum by (instance) (rate(node_disk_bytes_written{instance="$server"}[2m])) - intervalFactor: 4 - legendFormat: written - refId: B - step: 20 - - expr: sum by (instance) (rate(node_disk_io_time_ms{instance="$server"}[2m])) - intervalFactor: 4 - legendFormat: io time - refId: C - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Disk I/O - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: ms - label: - logBase: 1 - max: - min: - show: true - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percentunit - gauge: - maxValue: 1 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 7 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: (sum(node_filesystem_size{device!="rootfs",instance="$server"}) - sum(node_filesystem_free{device!="rootfs",instance="$server"})) - / sum(node_filesystem_size{device!="rootfs",instance="$server"}) - intervalFactor: 2 - refId: A - step: 60 - target: '' - thresholds: 0.75, 0.9 - title: Disk space usage - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - 
text: N/A - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 8 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: 'transmitted ' - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: rate(node_network_receive_bytes{instance="$server",device!~"lo"}[5m]) - hide: false - intervalFactor: 2 - legendFormat: "{{device}}" - refId: A - step: 10 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: Network received - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 10 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: 'transmitted ' - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: rate(node_network_transmit_bytes{instance="$server",device!~"lo"}[5m]) - hide: false - intervalFactor: 2 - legendFormat: "{{device}}" - 
refId: B - step: 10 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: Network transmitted - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: bytes - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - schemaVersion: 14 - style: dark - tags: [] - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: Server - multi: false - name: host - options: [] - query: label_values(node_uname_info, nodename) - refresh: 1 - regex: '' - sort: 0 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 2 - includeAll: false - label: Instance - multi: false - name: server - options: [] - query: label_values(node_uname_info{nodename="$host"}, instance) - refresh: 1 - regex: '' - sort: 0 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - time: - from: now-1h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: browser - title: Nodes - version: 2 - inputs: - - name: prometheus - pluginId: prometheus - type: datasource - value: prometheus - overwrite: true + nodes: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + 
"__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "4.4.1" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Dashboard to get an overview of one server", + "overwrite": true, + "editable": true, + "gnetId": 22, + "graphTooltip": 0, + "id": 8, + "links": [], + "panels": [ + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 0 + }, + "id": 3, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "100 - (avg by (cpu) (irate(node_cpu{mode=\"idle\", instance=\"$server\"}[5m])) * 100)", + "hide": false, + "intervalFactor": 10, + "legendFormat": "{{cpu}}", + "refId": "A", + "step": 50 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Idle cpu", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": 
true, + "values": [] + }, + "yaxes": [ + { + "format": "percent", + "label": "cpu usage", + "logBase": 1, + "max": 100, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 0 + }, + "id": 9, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "node_load1{instance=\"$server\"}", + "intervalFactor": 4, + "legendFormat": "load 1m", + "refId": "A", + "step": 20, + "target": "" + }, + { + "expr": "node_load5{instance=\"$server\"}", + "intervalFactor": 4, + "legendFormat": "load 5m", + "refId": "B", + "step": 20, + "target": "" + }, + { + "expr": "node_load15{instance=\"$server\"}", + "intervalFactor": 4, + "legendFormat": "load 15m", + "refId": "C", + "step": 20, + "target": "" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "System load", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "percentunit", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 
1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 18, + "x": 0, + "y": 7 + }, + "id": 4, + "legend": { + "alignAsTable": false, + "avg": false, + "current": false, + "hideEmpty": false, + "hideZero": false, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "node_memory_SwapFree{instance=\"$server\",job=\"prometheus\"}", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "node_memory_MemTotal{instance=\"$server\"} - node_memory_MemFree{instance=\"$server\"} - node_memory_Buffers{instance=\"$server\"} - node_memory_Cached{instance=\"$server\"}", + "hide": false, + "interval": "", + "intervalFactor": 2, + "legendFormat": "memory used", + "metric": "", + "refId": "C", + "step": 10 + }, + { + "expr": "node_memory_Buffers{instance=\"$server\"}", + "interval": "", + "intervalFactor": 2, + "legendFormat": "memory buffers", + "metric": "", + "refId": "E", + "step": 10 + }, + { + "expr": "node_memory_Cached{instance=\"$server\"}", + "intervalFactor": 2, + "legendFormat": "memory cached", + "metric": "", + "refId": "F", + "step": 10 + }, + { + "expr": "node_memory_MemFree{instance=\"$server\"}", + "intervalFactor": 2, + "legendFormat": "memory free", + "metric": "", + "refId": "D", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Memory usage", + "tooltip": { + "msResolution": 
false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 7 + }, + "id": 5, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "((node_memory_MemTotal{instance=\"$server\"} - node_memory_MemFree{instance=\"$server\"} - node_memory_Buffers{instance=\"$server\"} - node_memory_Cached{instance=\"$server\"}) / node_memory_MemTotal{instance=\"$server\"}) * 100", + "intervalFactor": 2, + "refId": "A", + "step": 60, + "target": "" + } + ], + "thresholds": "80, 90", + "title": "Memory usage", + "type": "singlestat", + "valueFontSize": "80%", + 
"valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 18, + "x": 0, + "y": 14 + }, + "id": 6, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "read", + "yaxis": 1 + }, + { + "alias": "{instance=\"$server\"}", + "yaxis": 2 + }, + { + "alias": "io time", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum by (instance) (rate(node_disk_bytes_read{instance=\"$server\"}[2m]))", + "hide": false, + "intervalFactor": 4, + "legendFormat": "read", + "refId": "A", + "step": 20, + "target": "" + }, + { + "expr": "sum by (instance) (rate(node_disk_bytes_written{instance=\"$server\"}[2m]))", + "intervalFactor": 4, + "legendFormat": "written", + "refId": "B", + "step": 20 + }, + { + "expr": "sum by (instance) (rate(node_disk_io_time_ms{instance=\"$server\"}[2m]))", + "intervalFactor": 4, + "legendFormat": "io time", + "refId": "C", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Disk I/O", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "ms", + "label": 
null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "percentunit", + "gauge": { + "maxValue": 1, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 14 + }, + "id": 7, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "(sum(node_filesystem_size{device!=\"rootfs\",instance=\"$server\"}) - sum(node_filesystem_free{device!=\"rootfs\",instance=\"$server\"})) / sum(node_filesystem_size{device!=\"rootfs\",instance=\"$server\"})", + "intervalFactor": 2, + "refId": "A", + "step": 60, + "target": "" + } + ], + "thresholds": "0.75, 0.9", + "title": "Disk space usage", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 21 
+ }, + "id": 8, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "transmitted ", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(node_network_receive_bytes{instance=\"$server\",device!~\"lo\"}[5m])", + "hide": false, + "intervalFactor": 2, + "legendFormat": "{{device}}", + "refId": "A", + "step": 10, + "target": "" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Network received", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 21 + }, + "id": 10, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "transmitted ", + 
"yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(node_network_transmit_bytes{instance=\"$server\",device!~\"lo\"}[5m])", + "hide": false, + "intervalFactor": 2, + "legendFormat": "{{device}}", + "refId": "B", + "step": 10, + "target": "" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Network transmitted", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": false, + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "Server", + "multi": false, + "name": "host", + "options": [], + "query": "label_values(node_uname_info, nodename)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 2, + "includeAll": false, + "label": "Instance", + "multi": false, + "name": "server", 
+ "options": [], + "query": "label_values(node_uname_info{nodename=\"$host\"}, instance)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "Nodes", + "version": 1 + } \ No newline at end of file diff --git a/grafana/values_overrides/openstack.yaml b/grafana/values_overrides/openstack.yaml index d143a7967..fb35b6fb2 100644 --- a/grafana/values_overrides/openstack.yaml +++ b/grafana/values_overrides/openstack.yaml @@ -3,3011 +3,4160 @@ # rabbitmq conf: dashboards: - rabbitmq: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.2.0 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - annotations: - list: [] - editable: true - gnetId: 2121 - graphTooltip: 0 - hideControls: false - id: - links: [] - refresh: 5m - rows: - - collapse: false - height: 266 - panels: - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 13 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - 
nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: rabbitmq_up{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - metric: rabbitmq_up{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - refId: A - step: 2 - thresholds: Up,Down - timeFrom: 30s - title: RabbitMQ Server - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - - op: "=" - text: Down - value: '0' - - op: "=" - text: Up - value: '1' - valueName: current - - alert: - conditions: - - evaluator: - params: - - 1 - type: lt - operator: - type: and - query: - params: - - A - - 10s - - now - reducer: - params: [] - type: last - type: query - - evaluator: - params: [] - type: no_value - operator: - type: and - query: - params: - - A - - 10s - - now - reducer: - params: [] - type: last - type: query - executionErrorState: alerting - frequency: 60s - handler: 1 - message: Some of the RabbitMQ node is down - name: Node Stats alert - noDataState: no_data - notifications: [] - aliasColors: {} - bars: true - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 12 - legend: - alignAsTable: true - avg: false - current: true - max: false - min: false - show: true - total: false - values: true - lines: false - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 9 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_running{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}" - metric: rabbitmq_running - refId: A - step: 2 - thresholds: - - colorMode: critical - fill: true - line: true - op: lt - value: 
1 - timeFrom: 30s - timeShift: - title: Node up Stats - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 6 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_exchangesTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{instance}}:exchanges" - metric: rabbitmq_exchangesTotal - refId: A - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Exchanges - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 4 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_channelsTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{instance}}:channels" - metric: rabbitmq_channelsTotal - refId: A - step: 2 - thresholds: [] - 
timeFrom: - timeShift: - title: Channels - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 3 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_consumersTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{instance}}:consumers" - metric: rabbitmq_consumersTotal - refId: A - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Consumers - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 5 - legend: - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_connectionsTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{instance}}:connections" - metric: rabbitmq_connectionsTotal - refId: A - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: 
Connections - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 7 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_queuesTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{instance}}:queues" - metric: rabbitmq_queuesTotal - refId: A - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Queues - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 8 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum by (vhost)(rabbitmq_queue_messages_ready{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}) - intervalFactor: 2 - legendFormat: "{{vhost}}:ready" - metric: rabbitmq_queue_messages_ready - refId: A - step: 2 - - expr: sum by 
(vhost)(rabbitmq_queue_messages_published_total{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}) - intervalFactor: 2 - legendFormat: "{{vhost}}:published" - metric: rabbitmq_queue_messages_published_total - refId: B - step: 2 - - expr: sum by (vhost)(rabbitmq_queue_messages_delivered_total{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}) - intervalFactor: 2 - legendFormat: "{{vhost}}:delivered" - metric: rabbitmq_queue_messages_delivered_total - refId: C - step: 2 - - expr: sum by (vhost)(rabbitmq_queue_messages_unacknowledged{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}) - intervalFactor: 2 - legendFormat: "{{vhost}}:unack" - metric: ack - refId: D - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Messages/host - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 2 - legend: - alignAsTable: true - avg: false - current: true - max: false - min: false - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_queue_messages{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{queue}}:{{durable}}" - metric: rabbitmq_queue_messages - refId: A - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Messages / Queue - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - 
max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 9 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_node_mem_used{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}:used" - metric: rabbitmq_node_mem_used - refId: A - step: 2 - - expr: rabbitmq_node_mem_limit{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}:limit" - metric: node_mem - refId: B - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Memory - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: decbytes - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 10 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_fd_used{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}:used" - metric: '' - refId: A - step: 2 - - expr: rabbitmq_fd_total{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: 
"{{node}}:total" - metric: node_mem - refId: B - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: FIle descriptors - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 11 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_sockets_used{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}:used" - metric: '' - refId: A - step: 2 - - expr: rabbitmq_sockets_total{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}:total" - metric: '' - refId: B - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Sockets - tooltip: - shared: true - sort: 0 - value_type: individual - transparent: false - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Dashboard Row - titleSize: h6 - schemaVersion: 14 - style: dark - tags: [] - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - current: {} - hide: 0 - label: null - name: rabbit - options: [] - type: query - 
query: label_values(rabbitmq_up, release_group) - refresh: 1 - sort: 1 - datasource: "${DS_PROMETHEUS}" - time: - from: now-5m - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: browser - title: RabbitMQ Metrics - version: 17 - description: 'Basic rabbitmq host stats: Node Stats, Exchanges, Channels, Consumers, Connections, - Queues, Messages, Messages per Queue, Memory, File Descriptors, Sockets.' - openstack_control_plane: - __inputs: - - name: prometheus - label: prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.5.2 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - - type: panel - id: text - name: Text - version: '' - annotations: - list: [] - editable: true - gnetId: - graphTooltip: 1 - hideControls: false - id: - links: [] - refresh: 5m - rows: - - collapse: false - height: 250px - panels: - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 24 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=keystone - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - 
rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_keystone_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Keystone - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 23 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=glance - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_glance_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - 
groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Glance - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(202, 58, 40, 0.86) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 22 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=heat - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_heat_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Heat - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 
'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 21 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=neutron - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_neutron_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Neutron - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(208, 53, 34, 0.82) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - 
format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 20 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=nova - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_nova_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Nova - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 19 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=swift - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to 
text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_swift_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Ceph - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 18 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=cinder - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - 
condition: '' - expr: openstack_check_cinder_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Cinder - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 17 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=placement - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_placement_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - 
resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Placement - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(208, 53, 34, 0.82) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 16 - interval: "> 60s" - links: - - dashboard: RabbitMQ Metrics - name: Drilldown dashboard - title: RabbitMQ Metrics - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: min(rabbitmq_up) - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: RabbitMQ - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(208, 53, 34, 0.82) - - rgba(118, 245, 40, 0.73) - - rgba(225, 
177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 15 - interval: "> 60s" - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: min(mysql_global_status_wsrep_ready) - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: MariaDB - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(225, 177, 40, 0.59) - - rgba(208, 53, 34, 0.82) - - rgba(118, 245, 40, 0.73) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 14 - interval: "> 60s" - links: - - dashboard: Nginx Stats - name: Drilldown dashboard - title: Nginx Stats - type: dashboard - mappingType: 2 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - 
prefixFontSize: 50% - rangeMaps: - - from: '1' - text: OK - to: '99999999999999' - - from: '0' - text: CRIT - to: '0' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: sum_over_time(nginx_connections_total{type="active", namespace="openstack"}[5m]) - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '0,1' - title: Nginx - type: singlestat - valueFontSize: 50% - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(208, 53, 34, 0.82) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 13 - interval: "> 60s" - links: - - dashboard: Memcached - name: Drilldown dashboard - title: Memcached - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: min(memcached_up) - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false 
- refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Memcached - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: OpenStack Services - titleSize: h6 - - collapse: false - height: 250px - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 11 - interval: "> 60s" - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 3 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - alias: free - column: value - expr: openstack_total_used_vcpus{job="openstack-metrics", region="$region"} + openstack_total_free_vcpus{job="openstack-metrics", - region="$region"} - format: time_series - function: min - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - - alias: used - column: value - expr: openstack_total_used_vcpus{job="openstack-metrics", region="$region"} - format: time_series - function: max - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - intervalFactor: 2 - policy: default - rawQuery: false - refId: B - resultFormat: time_series - step: 120 - thresholds: [] - timeFrom: - timeShift: - title: VCPUs (total vs used) - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - 
name: - show: true - values: [] - yaxes: - - format: short - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 12 - interval: "> 60s" - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 3 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - alias: free - column: value - expr: openstack_total_used_ram_MB{job="openstack-metrics", region="$region"} + openstack_total_free_ram_MB{job="openstack-metrics", - region="$region"} - format: time_series - function: mean - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - - alias: used - column: value - expr: openstack_total_used_ram_MB{job="openstack-metrics", region="$region"} - format: time_series - function: mean - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: B - resultFormat: time_series - step: 120 - thresholds: [] - timeFrom: - timeShift: - title: RAM (total vs used) - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: mbytes - label: '' - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: 
false - fill: 1 - grid: {} - id: 13 - interval: "> 60s" - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 3 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - alias: free - column: value - expr: openstack_total_used_disk_GB{job="openstack-metrics", region="$region"} + openstack_total_free_disk_GB{job="openstack-metrics", - region="$region"} - format: time_series - function: mean - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - - alias: used - column: value - expr: openstack_total_used_disk_GB{job="openstack-metrics", region="$region"} - format: time_series - function: mean - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - intervalFactor: 2 - policy: default - rawQuery: false - refId: B - resultFormat: time_series - step: 120 - thresholds: [] - timeFrom: - timeShift: - title: Disk (used vs total) - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: gbytes - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes": false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 27 - interval: "> 60s" - legend: - alignAsTable: false - avg: true - current: true - hideEmpty: true - hideZero: false - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 4 - links: [] - nullPointMode: null - percentage: false - 
pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - alias: free - column: value - expr: sum(openstack_running_instances) - format: time_series - function: mean - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - interval: "15s" - intervalFactor: 1 - legendFormat: "{{ running_vms }}" - policy: default - rawQuery: false - refID: A - resultFormat: time_series - - alias: used - column: value - expr: sum(openstack_total_running_instances) - format: time_series - function: mean - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - interval: "15s" - intervalFactor: 1 - legendFormat: "{{ total_vms }}" - policy: default - rawQuery: false - refID: B - resultFormat: time_series - step: 120 - thresholds: [] - timeFrom: - timeShift: - title: OpenStack Instances - tooltip: - msResolution: false - shared: true - sort : 0 - value_type: cumulative - transparent: true - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: none - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Virtual resources - titleSize: h6 - schemaVersion: 14 - style: dark - tags: [] - templating: - enable: true - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: - multi: false - name: region - options: [] - query: label_values(openstack_exporter_cache_refresh_duration_seconds, region) - refresh: 1 - regex: '' - sort: 0 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - 
time: - from: now-1h - to: now - timepicker: - collapse: false - enable: true - notice: false - now: true - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - status: Stable - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - type: timepicker - timezone: browser - title: OpenStack Metrics - version: 2 - openstack-service: - __inputs: - - name: prometheus - label: prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.5.2 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - annotations: - enable: true - list: [] - editable: true - gnetId: - graphTooltip: 1 - hideControls: false - id: - links: [] - refresh: 5m - rows: - - collapse: false - height: 250px - panels: - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(225, 177, 40, 0.59) - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 6 - interval: "> 60s" - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_[[Service]]_api{job="openstack-metrics"} - fill: '' - format: time_series - function: last - groupBy: - - params: 
- - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '0,1' - title: '' - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: CRITICAL - value: '0' - - op: "=" - text: OK - value: '1' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 13 - interval: "> 60s" - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - column: value - condition: '' - expr: sum(nginx_responses_total{server_zone=~"[[Service]].*", status_code="5xx"}) - fill: '' - format: time_series - function: count - groupBy: - - interval: auto - params: - - auto - type: time - - params: - - '0' - type: fill - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - tags: [] - thresholds: '' - title: HTTP 5xx errors - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: '0' - value: 'null' - valueName: current - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 0 - grid: {} - id: 7 - interval: ">60s" - legend: - 
alignAsTable: true - avg: true - current: false - max: true - min: true - show: true - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 8 - stack: false - steppedLine: false - targets: - - expr: sum(nginx_upstream_response_msecs_avg{upstream=~"openstack-[[Service]].*"}) - by (upstream) - format: time_series - intervalFactor: 2 - refId: A - step: 120 - thresholds: [] - timeFrom: - timeShift: - title: HTTP response time - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 9 - interval: "> 60s" - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: true - targets: - - alias: healthy - column: value - expr: openstack_check_[[Service]]_api - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - select: [] - step: 120 - tags: [] - thresholds: [] - timeFrom: - timeShift: - title: API Availability - tooltip: - msResolution: false - shared: false - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] 
- yaxes: - - format: none - label: '' - logBase: 1 - max: 1 - min: 0 - show: false - - format: short - logBase: 1 - max: - min: - show: false - - aliasColors: - '{status_code="2xx"}': "#629E51" - '{status_code="5xx"}': "#BF1B00" - bars: true - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 0 - grid: {} - id: 8 - interval: "> 60s" - legend: - alignAsTable: false - avg: false - current: false - hideEmpty: false - max: false - min: false - rightSide: false - show: true - total: false - values: false - lines: false - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 8 - stack: true - steppedLine: false - targets: - - expr: sum(nginx_responses_total{server_zone=~"[[Service]].*"}) by (status_code) - format: time_series - intervalFactor: 2 - refId: A - step: 120 - thresholds: [] - timeFrom: - timeShift: - title: Number of HTTP responses - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Service Status - titleSize: h6 - schemaVersion: 14 - style: dark - tags: [] - templating: - enable: true - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: - current: - tags: [] - text: cinder - value: cinder - hide: 0 - includeAll: false - label: - multi: false - name: Service - options: - - selected: false - text: nova - value: nova - - selected: false - text: glance - value: glance - - selected: false - text: keystone - value: keystone - - 
selected: true - text: cinder - value: cinder - - selected: false - text: heat - value: heat - - selected: false - text: placement - value: placement - - selected: false - text: neutron - value: neutron - query: nova,glance,keystone,cinder,heat,placement,neutron - type: custom - time: - from: now-1h - to: now - timepicker: - collapse: false - enable: true - notice: false - now: true - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - status: Stable - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - type: timepicker - timezone: browser - title: Openstack Service - version: 4 + rabbitmq: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "Prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "4.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [] + }, + "editable": true, + "overwrite": true, + "gnetId": 2121, + "graphTooltip": 0, + "hideControls": false, + "id": null, + "links": [], + "refresh": "5s", + "rows": [ + { + "collapse": false, + "height": 266, + "panels": [ + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "id": 13, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 
+ }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "span": 3, + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "targets": [ + { + "expr": "rabbitmq_up", + "intervalFactor": 2, + "metric": "rabbitmq_up", + "refId": "A", + "step": 2 + } + ], + "thresholds": "Up,Down", + "timeFrom": "30s", + "title": "RabbitMQ Server", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + }, + { + "op": "=", + "text": "Down", + "value": "0" + }, + { + "op": "=", + "text": "Up", + "value": "1" + } + ], + "valueName": "current" + }, + { + "alert": { + "conditions": [ + { + "evaluator": { + "params": [ + 1 + ], + "type": "lt" + }, + "operator": { + "type": "and" + }, + "query": { + "params": [ + "A", + "10s", + "now" + ] + }, + "reducer": { + "params": [], + "type": "last" + }, + "type": "query" + }, + { + "evaluator": { + "params": [], + "type": "no_value" + }, + "operator": { + "type": "and" + }, + "query": { + "params": [ + "A", + "10s", + "now" + ] + }, + "reducer": { + "params": [], + "type": "last" + }, + "type": "query" + } + ], + "executionErrorState": "alerting", + "frequency": "60s", + "handler": 1, + "message": "Some of the RabbitMQ node is down", + "name": "Node Stats alert", + "noDataState": "no_data", + "notifications": [] + }, + "aliasColors": {}, + "bars": true, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "id": 12, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": false, + "linewidth": 1, + "links": [], + "nullPointMode": "null", 
+ "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "span": 9, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_running", + "intervalFactor": 2, + "legendFormat": "{{node}}", + "metric": "rabbitmq_running", + "refId": "A", + "step": 2 + } + ], + "thresholds": [ + { + "colorMode": "critical", + "fill": true, + "line": true, + "op": "lt", + "value": 1 + } + ], + "timeFrom": "30s", + "timeShift": null, + "title": "Node up Stats", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "id": 6, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "span": 4, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_exchangesTotal", + "intervalFactor": 2, + "legendFormat": "{{instance}}:exchanges", + "metric": "rabbitmq_exchangesTotal", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Exchanges", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + 
"max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "id": 4, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "span": 4, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_channelsTotal", + "intervalFactor": 2, + "legendFormat": "{{instance}}:channels", + "metric": "rabbitmq_channelsTotal", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Channels", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "id": 3, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "span": 4, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_consumersTotal", + "intervalFactor": 2, + "legendFormat": 
"{{instance}}:consumers", + "metric": "rabbitmq_consumersTotal", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Consumers", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "id": 5, + "legend": { + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "span": 4, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_connectionsTotal", + "intervalFactor": 2, + "legendFormat": "{{instance}}:connections", + "metric": "rabbitmq_connectionsTotal", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Connections", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "id": 7, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, 
+ "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "span": 4, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_queuesTotal", + "intervalFactor": 2, + "legendFormat": "{{instance}}:queues", + "metric": "rabbitmq_queuesTotal", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Queues", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "id": 8, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "span": 6, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum by (vhost)(rabbitmq_queue_messages_ready)", + "intervalFactor": 2, + "legendFormat": "{{vhost}}:ready", + "metric": "rabbitmq_queue_messages_ready", + "refId": "A", + "step": 2 + }, + { + "expr": "sum by (vhost)(rabbitmq_queue_messages_published_total)", + "intervalFactor": 2, + "legendFormat": "{{vhost}}:published", + "metric": "rabbitmq_queue_messages_published_total", + "refId": "B", + "step": 2 + }, + { + "expr": "sum by 
(vhost)(rabbitmq_queue_messages_delivered_total)", + "intervalFactor": 2, + "legendFormat": "{{vhost}}:delivered", + "metric": "rabbitmq_queue_messages_delivered_total", + "refId": "C", + "step": 2 + }, + { + "expr": "sum by (vhost)(rabbitmq_queue_messages_unacknowledged)", + "intervalFactor": 2, + "legendFormat": "{{vhost}}:unack", + "metric": "ack", + "refId": "D", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Messages/host", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "id": 2, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "span": 6, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_queue_messages", + "intervalFactor": 2, + "legendFormat": "{{queue}}:{{durable}}", + "metric": "rabbitmq_queue_messages", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Messages / Queue", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, 
+ "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "id": 9, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "span": 6, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_node_mem_used", + "intervalFactor": 2, + "legendFormat": "{{node}}:used", + "metric": "rabbitmq_node_mem_used", + "refId": "A", + "step": 2 + }, + { + "expr": "rabbitmq_node_mem_limit", + "intervalFactor": 2, + "legendFormat": "{{node}}:limit", + "metric": "node_mem", + "refId": "B", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Memory", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "id": 10, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "span": 6, + "stack": false, + "steppedLine": 
false, + "targets": [ + { + "expr": "rabbitmq_fd_used", + "intervalFactor": 2, + "legendFormat": "{{node}}:used", + "metric": "", + "refId": "A", + "step": 2 + }, + { + "expr": "rabbitmq_fd_total", + "intervalFactor": 2, + "legendFormat": "{{node}}:total", + "metric": "node_mem", + "refId": "B", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "File descriptors", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "id": 11, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "span": 6, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_sockets_used", + "intervalFactor": 2, + "legendFormat": "{{node}}:used", + "metric": "", + "refId": "A", + "step": 2 + }, + { + "expr": "rabbitmq_sockets_total", + "intervalFactor": 2, + "legendFormat": "{{node}}:total", + "metric": "", + "refId": "B", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Sockets", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "transparent": false, + "type": "graph", + "xaxis": { + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, +
"logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + } + ], + "repeat": null, + "repeatIteration": null, + "repeatRowId": null, + "showTitle": false, + "title": "Dashboard Row", + "titleSize": "h6" + } + ], + "schemaVersion": 14, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "tags": [], + "text": "Prometheus", + "value": "Prometheus" + }, + "hide": 0, + "label": null, + "name": "datasource", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "type": "datasource" + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "RabbitMQ Metrics", + "version": 17, + "description": "Basic rabbitmq host stats: Node Stats, Exchanges, Channels, Consumers, Connections, Queues, Messages, Messages per Queue, Memory, File Descriptors, Sockets." 
+ } + openstack_control_plane: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "4.5.2" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + }, + { + "type": "panel", + "id": "text", + "name": "Text", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 1, + "id": 11, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 28, + "panels": [], + "repeat": null, + "title": "OpenStack Services", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 0, + "y": 1 + }, + "id": 24, + "interval": "> 60s", + "links": [ + { + "dashboard": "Openstack Service", + "name": "Drilldown dashboard", + "params": "var-Service=keystone", + "title": "Openstack Service", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + 
"name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_keystone_api{job=\"openstack-metrics\", region=\"$region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Keystone", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "CRIT", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 2, + "y": 1 + }, + "id": 23, + "interval": "> 60s", + "links": [ + { + "dashboard": "Openstack Service", + "name": "Drilldown dashboard", + "params": "var-Service=glance", + 
"title": "Openstack Service", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_glance_api{job=\"openstack-metrics\", region=\"$region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Glance", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "CRIT", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(202, 58, 40, 0.86)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 4, + "y": 1 + }, + 
"id": 22, + "interval": "> 60s", + "links": [ + { + "dashboard": "Openstack Service", + "name": "Drilldown dashboard", + "params": "var-Service=heat", + "title": "Openstack Service", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_heat_api{job=\"openstack-metrics\", region=\"$region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Heat", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "CRIT", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + 
"minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 6, + "y": 1 + }, + "id": 21, + "interval": "> 60s", + "links": [ + { + "dashboard": "Openstack Service", + "name": "Drilldown dashboard", + "params": "var-Service=neutron", + "title": "Openstack Service", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_neutron_api{job=\"openstack-metrics\", region=\"$region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Neutron", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "CRIT", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(208, 53, 34, 0.82)", + "rgba(118, 245, 40, 0.73)", + 
"rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 8, + "y": 1 + }, + "id": 20, + "interval": "> 60s", + "links": [ + { + "dashboard": "Openstack Service", + "name": "Drilldown dashboard", + "params": "var-Service=nova", + "title": "Openstack Service", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_nova_api{job=\"openstack-metrics\", region=\"$region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Nova", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "CRIT", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + 
"cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 10, + "y": 1 + }, + "id": 19, + "interval": "> 60s", + "links": [ + { + "dashboard": "Openstack Service", + "name": "Drilldown dashboard", + "params": "var-Service=swift", + "title": "Openstack Service", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_swift_api{job=\"openstack-metrics\", region=\"$region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Ceph", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "CRIT", + "value": "0" + }, 
+ { + "op": "=", + "text": "OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 12, + "y": 1 + }, + "id": 18, + "interval": "> 60s", + "links": [ + { + "dashboard": "Openstack Service", + "name": "Drilldown dashboard", + "params": "var-Service=cinder", + "title": "Openstack Service", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_cinder_api{job=\"openstack-metrics\", region=\"$region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Cinder", + "type": "singlestat", + 
"valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "CRIT", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 14, + "y": 1 + }, + "id": 17, + "interval": "> 60s", + "links": [ + { + "dashboard": "Openstack Service", + "name": "Drilldown dashboard", + "params": "var-Service=placement", + "title": "Openstack Service", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_placement_api{job=\"openstack-metrics\", region=\"$region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + 
"rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Placement", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "CRIT", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(208, 53, 34, 0.82)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 16, + "y": 1 + }, + "id": 16, + "interval": "> 60s", + "links": [ + { + "dashboard": "RabbitMQ Metrics", + "name": "Drilldown dashboard", + "title": "RabbitMQ Metrics", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "min(rabbitmq_up)", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + 
"interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "RabbitMQ", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "CRIT", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(208, 53, 34, 0.82)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 18, + "y": 1 + }, + "id": 15, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "min(mysql_global_status_wsrep_ready)", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": 
"default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "MariaDB", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "CRIT", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(225, 177, 40, 0.59)", + "rgba(208, 53, 34, 0.82)", + "rgba(118, 245, 40, 0.73)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 20, + "y": 1 + }, + "id": 14, + "interval": "> 60s", + "links": [ + { + "dashboard": "Nginx Stats", + "name": "Drilldown dashboard", + "title": "Nginx Stats", + "type": "dashboard" + } + ], + "mappingType": 2, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "1", + "text": "OK", + "to": "99999999999999" + }, + { + "from": "0", + "text": "CRIT", + "to": "0" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum_over_time(nginx_connections_total{type=\"active\", namespace=\"openstack\"}[5m])", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + 
], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "0,1", + "title": "Nginx", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(208, 53, 34, 0.82)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 22, + "y": 1 + }, + "id": 13, + "interval": "> 60s", + "links": [ + { + "dashboard": "Memcached", + "name": "Drilldown dashboard", + "title": "Memcached", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "min(memcached_up)", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + 
"groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Memcached", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "CRIT", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 2, + "x": 22, + "y": 8 + }, + "id": 13, + "interval": "> 60s", + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "alias": "free", + "column": "value", + "expr": "openstack_total_used_disk_GB{job=\"openstack-metrics\", region=\"$region\"} + openstack_total_free_disk_GB{job=\"openstack-metrics\", region=\"$region\"}", + "format": "time_series", + "function": "mean", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + }, + { + "alias": "used", + "column": "value", + "expr": "openstack_total_used_disk_GB{job=\"openstack-metrics\", region=\"$region\"}", + "format": "time_series", + "function": "mean", + "groupBy": [ + { 
+ "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "B", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Disk (used vs total)", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "gbytes", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 15 + }, + "id": 29, + "panels": [], + "repeat": null, + "title": "Virtual resources", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 16 + }, + "id": 11, + "interval": "> 60s", + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "alias": "free", + "column": "value", + "expr": "openstack_total_used_vcpus{job=\"openstack-metrics\", region=\"$region\"} + openstack_total_free_vcpus{job=\"openstack-metrics\", region=\"$region\"}", + "format": "time_series", + 
"function": "min", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + }, + { + "alias": "used", + "column": "value", + "expr": "openstack_total_used_vcpus{job=\"openstack-metrics\", region=\"$region\"}", + "format": "time_series", + "function": "max", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "B", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "VCPUs (total vs used)", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 16 + }, + "id": 12, + "interval": "> 60s", + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + 
"spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "alias": "free", + "column": "value", + "expr": "openstack_total_used_ram_MB{job=\"openstack-metrics\", region=\"$region\"} + openstack_total_free_ram_MB{job=\"openstack-metrics\", region=\"$region\"}", + "format": "time_series", + "function": "mean", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + }, + { + "alias": "used", + "column": "value", + "expr": "openstack_total_used_ram_MB{job=\"openstack-metrics\", region=\"$region\"}", + "format": "time_series", + "function": "mean", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "B", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "RAM (total vs used)", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "mbytes", + "label": "", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "dashes\"": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 23 + }, + "id": 27, + 
"interval": "> 60s", + "legend": { + "alignAsTable": false, + "avg": true, + "current": true, + "hideEmpty": true, + "hideZero": false, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 4, + "links": [], + "nullPointMode": null, + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "alias": "free", + "column": "value", + "expr": "sum(openstack_running_instances)", + "format": "time_series", + "function": "mean", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "interval": "15s", + "intervalFactor": 1, + "legendFormat": "{{ running_vms }}", + "policy": "default", + "rawQuery": false, + "refID": "A", + "refId": "A", + "resultFormat": "time_series" + }, + { + "alias": "used", + "column": "value", + "expr": "sum(openstack_total_running_instances)", + "format": "time_series", + "function": "mean", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "interval": "15s", + "intervalFactor": 1, + "legendFormat": "{{ total_vms }}", + "policy": "default", + "rawQuery": false, + "refID": "B", + "refId": "B", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "OpenStack Instances", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "transparent": true, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": 
"short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": null, + "multi": false, + "name": "region", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "collapse": false, + "enable": true, + "notice": false, + "now": true, + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "status": "Stable", + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ], + "type": "timepicker" + }, + "timezone": "browser", + "title": "OpenStack Metrics", + "version": 1 + } + openstack-service: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "4.5.2" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": 
"Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "enable": true, + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 1, + "id": 29, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 14, + "panels": [], + "repeat": null, + "title": "Service Status", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(225, 177, 40, 0.59)", + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 6, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_[[Service]]_api{job=\"openstack-metrics\",region=\"$region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ 
+ "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "0,1", + "title": "", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 4, + "y": 1 + }, + "id": 13, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum(nginx_responses_total{server_zone=~\"[[Service]].*\", status_code=\"5xx\",region=\"$region\"})", + "fill": "", + "format": "time_series", + "function": "count", + "groupBy": [ + { + "interval": "auto", + "params": [ + "auto" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } 
+ ], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120, + "tags": [] + } + ], + "thresholds": "", + "title": "HTTP 5xx errors", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 16, + "x": 8, + "y": 1 + }, + "id": 7, + "interval": ">60s", + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": true, + "min": true, + "show": true, + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(nginx_upstream_response_msecs_avg{upstream=~\"openstack-[[Service]].*\",region=\"$region\"}) by (upstream)", + "format": "time_series", + "intervalFactor": 2, + "refId": "A", + "step": 120 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "HTTP response time", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + 
"dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 8 + }, + "id": 9, + "interval": "> 60s", + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "alias": "healthy", + "column": "value", + "expr": "openstack_check_[[Service]]_api{region=\"$region\"}", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "select": [], + "step": 120, + "tags": [] + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "API Availability", + "tooltip": { + "msResolution": false, + "shared": false, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "", + "logBase": 1, + "max": 1, + "min": 0, + "show": false + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "{status_code=\"2xx\"}": "#629E51", + "{status_code=\"5xx\"}": "#BF1B00" + }, + "bars": true, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + 
"grid": {}, + "gridPos": { + "h": 7, + "w": 16, + "x": 8, + "y": 8 + }, + "id": 8, + "interval": "> 60s", + "legend": { + "alignAsTable": false, + "avg": false, + "current": false, + "hideEmpty": false, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "total": false, + "values": false + }, + "lines": false, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum(nginx_responses_total{server_zone=~\"[[Service]].*\",region=\"$region\"}) by (status_code)", + "format": "time_series", + "intervalFactor": 2, + "refId": "A", + "step": 120 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Number of HTTP responses", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "prometheus", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "region", + "multi": false, + 
"name": "region", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": { + "tags": [], + "text": "cinder", + "value": "cinder" + }, + "hide": 0, + "includeAll": false, + "label": null, + "multi": false, + "name": "Service", + "options": [ + { + "selected": false, + "text": "nova", + "value": "nova" + }, + { + "selected": false, + "text": "glance", + "value": "glance" + }, + { + "selected": false, + "text": "keystone", + "value": "keystone" + }, + { + "selected": true, + "text": "cinder", + "value": "cinder" + }, + { + "selected": false, + "text": "heat", + "value": "heat" + }, + { + "selected": false, + "text": "placement", + "value": "placement" + }, + { + "selected": false, + "text": "neutron", + "value": "neutron" + } + ], + "query": "nova,glance,keystone,cinder,heat,placement,neutron", + "skipUrlSync": false, + "type": "custom" + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "collapse": false, + "enable": true, + "notice": false, + "now": true, + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "status": "Stable", + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ], + "type": "timepicker" + }, + "timezone": "browser", + "title": "Openstack Service", + "version": 1 + } \ No newline at end of file diff --git a/grafana/values_overrides/persistentvolume.yaml b/grafana/values_overrides/persistentvolume.yaml new file mode 100644 index 000000000..6eb99018a --- /dev/null +++ b/grafana/values_overrides/persistentvolume.yaml @@ -0,0 +1,551 @@ +# This overrides file provides a raw json file for a dashboard for +# the etcd +conf: + dashboards: + persistent_volume: |- + { + 
"__inputs": [ + { + "name": "prometheus", + "label": "Prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + } + ], + "annotations": { + "list": [ + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "hideControls": false, + "id": null, + "links": [ + ], + "refresh": "", + "rows": [ + { + "collapse": false, + "collapsed": false, + "panels": [ + { + "aliasColors": { + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "$datasource", + "fill": 1, + "gridPos": { + }, + "id": 2, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [ + ], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "repeat": null, + "seriesOverrides": [ + ], + "spaceLength": 10, + "span": 9, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "(\n sum without(instance, node) (kubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n -\n sum without(instance, node) (kubelet_volume_stats_available_bytes{cluster=\"$cluster\", job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n)\n", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "Used Space", + "refId": "A" + }, + { + "expr": "sum without(instance, node) (kubelet_volume_stats_available_bytes{cluster=\"$cluster\", job=\"kubelet\", namespace=\"$namespace\", 
persistentvolumeclaim=\"$volume\"})\n", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "Free Space", + "refId": "B" + } + ], + "thresholds": [ + ], + "timeFrom": null, + "timeShift": null, + "title": "Volume Space Usage", + "tooltip": { + "shared": false, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [ + ] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ] + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "$datasource", + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + }, + "id": 3, + "interval": null, + "links": [ + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "span": 3, + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "(\n kubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"}\n -\n kubelet_volume_stats_available_bytes{cluster=\"$cluster\", job=\"kubelet\", namespace=\"$namespace\", 
persistentvolumeclaim=\"$volume\"}\n)\n/\nkubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"}\n* 100\n", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A" + } + ], + "thresholds": "80, 90", + "title": "Volume Space Usage", + "tooltip": { + "shared": false + }, + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + } + ], + "repeat": null, + "repeatIteration": null, + "repeatRowId": null, + "showTitle": false, + "title": "Dashboard Row", + "titleSize": "h6", + "type": "row" + }, + { + "collapse": false, + "collapsed": false, + "panels": [ + { + "aliasColors": { + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "$datasource", + "fill": 1, + "gridPos": { + }, + "id": 4, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [ + ], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "repeat": null, + "seriesOverrides": [ + ], + "spaceLength": 10, + "span": 9, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum without(instance, node) (kubelet_volume_stats_inodes_used{cluster=\"$cluster\", job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "Used inodes", + "refId": "A" + }, + { + "expr": "(\n sum without(instance, node) (kubelet_volume_stats_inodes{cluster=\"$cluster\", job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n -\n sum without(instance, node) (kubelet_volume_stats_inodes_used{cluster=\"$cluster\", job=\"kubelet\", namespace=\"$namespace\", 
persistentvolumeclaim=\"$volume\"})\n)\n", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": " Free inodes", + "refId": "B" + } + ], + "thresholds": [ + ], + "timeFrom": null, + "timeShift": null, + "title": "Volume inodes Usage", + "tooltip": { + "shared": false, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [ + ] + }, + "yaxes": [ + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ] + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "$datasource", + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + }, + "id": 5, + "interval": null, + "links": [ + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "span": 3, + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "kubelet_volume_stats_inodes_used{cluster=\"$cluster\", job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"}\n/\nkubelet_volume_stats_inodes{cluster=\"$cluster\", job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"}\n* 100\n", + "format": 
"time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A" + } + ], + "thresholds": "80, 90", + "title": "Volume inodes Usage", + "tooltip": { + "shared": false + }, + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + } + ], + "repeat": null, + "repeatIteration": null, + "repeatRowId": null, + "showTitle": false, + "title": "Dashboard Row", + "titleSize": "h6", + "type": "row" + } + ], + "schemaVersion": 14, + "style": "dark", + "tags": [ + "kubernetes-mixin" + ], + "templating": { + "list": [ + { + "current": { + "text": "Prometheus", + "value": "Prometheus" + }, + "hide": 0, + "label": null, + "name": "datasource", + "options": [ + ], + "query": "prometheus", + "refresh": 1, + "regex": "", + "type": "datasource" + }, + { + "allValue": null, + "current": { + }, + "datasource": "$datasource", + "hide": 2, + "includeAll": false, + "label": "cluster", + "multi": false, + "name": "cluster", + "options": [ + ], + "query": "label_values(kubelet_volume_stats_capacity_bytes, cluster)", + "refresh": 2, + "regex": "", + "sort": 1, + "tagValuesQuery": "", + "tags": [ + ], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": { + }, + "datasource": "$datasource", + "hide": 0, + "includeAll": false, + "label": "Namespace", + "multi": false, + "name": "namespace", + "options": [ + ], + "query": "label_values(kubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"kubelet\"}, namespace)", + "refresh": 2, + "regex": "", + "sort": 1, + "tagValuesQuery": "", + "tags": [ + ], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": { + }, + "datasource": "$datasource", + "hide": 0, + "includeAll": false, + "label": "PersistentVolumeClaim", + "multi": false, + "name": "volume", + "options": [ + ], + "query": 
"label_values(kubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"kubelet\", namespace=\"$namespace\"}, persistentvolumeclaim)", + "refresh": 2, + "regex": "", + "sort": 1, + "tagValuesQuery": "", + "tags": [ + ], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "", + "title": "Persistent Volumes", + "version": 0 + } \ No newline at end of file diff --git a/grafana/values_overrides/prometheus.yaml b/grafana/values_overrides/prometheus.yaml index d1aa99eac..73a8551ee 100644 --- a/grafana/values_overrides/prometheus.yaml +++ b/grafana/values_overrides/prometheus.yaml @@ -2,2794 +2,3706 @@ # Prometheus conf: dashboards: - prometheus: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: Prometheus which you want to monitor - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.6.0 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - - type: panel - id: text - name: Text - version: '' - annotations: - list: - - builtIn: 1 - datasource: "-- Grafana --" - enable: true - hide: true - iconColor: rgba(0, 211, 255, 1) - name: Annotations & Alerts - type: dashboard - - datasource: "${DS_PROMETHEUS}" - enable: true - expr: count(sum(up{instance="$instance"}) by (instance) < 1) - hide: false - iconColor: rgb(250, 44, 18) - limit: 100 - name: downage - showIn: 0 - step: 30s - tagKeys: instance - textFormat: prometheus down - titleFormat: Downage - type: alert - - datasource: "${DS_PROMETHEUS}" - enable: true 
- expr: sum(changes(prometheus_config_last_reload_success_timestamp_seconds[10m])) - by (instance) - hide: false - iconColor: "#fceaca" - limit: 100 - name: Reload - showIn: 0 - step: 5m - tagKeys: instance - tags: [] - titleFormat: Reload - type: tags - description: Dashboard for monitoring of Prometheus v2.x.x - editable: true - gnetId: 3681 - graphTooltip: 1 - hideControls: false - id: - links: - - icon: info - tags: [] - targetBlank: true - title: 'Dashboard''s Github ' - tooltip: Github repo of this dashboard - type: link - url: https://github.com/FUSAKLA/Prometheus2-grafana-dashboard - - icon: doc - tags: [] - targetBlank: true - title: Prometheus Docs - tooltip: '' - type: link - url: http://prometheus.io/docs/introduction/overview/ - refresh: 5m - rows: - - collapse: false - height: 161 - panels: - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - "#299c46" - - rgba(237, 129, 40, 0.89) - - "#bf1b00" - datasource: "${DS_PROMETHEUS}" - decimals: 1 - format: s - gauge: - maxValue: 1000000 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 41 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: time() - process_start_time_seconds{instance="$instance"} - format: time_series - instant: false - intervalFactor: 2 - refId: A - thresholds: '' - title: Uptime - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - "#299c46" - - rgba(237, 129, 40, 0.89) - - "#bf1b00" - 
datasource: "${DS_PROMETHEUS}" - format: short - gauge: - maxValue: 1000000 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 42 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: prometheus_tsdb_head_series{instance="$instance"} - format: time_series - instant: false - intervalFactor: 2 - refId: A - thresholds: '500000,800000,1000000' - title: Total count of time series - type: singlestat - valueFontSize: 150% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - "#299c46" - - rgba(237, 129, 40, 0.89) - - "#d44a3a" - datasource: "${DS_PROMETHEUS}" - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 48 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: version - targets: - - expr: prometheus_build_info{instance="$instance"} - format: table - instant: true - intervalFactor: 2 - refId: A - thresholds: '' - title: Version - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - - cacheTimeout: - colorBackground: 
false - colorValue: false - colors: - - "#299c46" - - rgba(237, 129, 40, 0.89) - - "#d44a3a" - datasource: "${DS_PROMETHEUS}" - decimals: 2 - format: ms - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 49 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: prometheus_tsdb_head_max_time{instance="$instance"} - prometheus_tsdb_head_min_time{instance="$instance"} - format: time_series - instant: true - intervalFactor: 2 - refId: A - thresholds: '' - title: Actual head block length - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - content: - height: '' - id: 50 - links: [] - mode: html - span: 1 - title: '' - transparent: true - type: text - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - "#e6522c" - - rgba(237, 129, 40, 0.89) - - "#299c46" - datasource: "${DS_PROMETHEUS}" - decimals: 1 - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 52 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: '2' - format: time_series - 
intervalFactor: 2 - refId: A - thresholds: '10,20' - title: '' - transparent: true - type: singlestat - valueFontSize: 200% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Header instance info - titleSize: h6 - - collapse: false - height: '250' - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 15 - legend: - avg: true - current: false - max: false - min: false - show: false - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: true - steppedLine: false - targets: - - expr: max(prometheus_engine_query_duration_seconds{instance="$instance"}) by - (instance, slice) - format: time_series - intervalFactor: 1 - legendFormat: max duration for {{slice}} - metric: prometheus_local_storage_rushed_mode - refId: A - step: 900 - thresholds: [] - timeFrom: - timeShift: - title: Query elapsed time - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: '' - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 17 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - 
spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(increase(prometheus_tsdb_head_series_created_total{instance="$instance"}[$aggregation_interval])) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: created on {{ instance }} - metric: prometheus_local_storage_maintain_series_duration_seconds_count - refId: A - step: 1800 - - expr: sum(increase(prometheus_tsdb_head_series_removed_total{instance="$instance"}[$aggregation_interval])) - by (instance) * -1 - format: time_series - intervalFactor: 2 - legendFormat: removed on {{ instance }} - refId: B - thresholds: [] - timeFrom: - timeShift: - title: Head series created/deleted - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 13 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(increase(prometheus_target_scrapes_exceeded_sample_limit_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: exceeded_sample_limit on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: A - step: 1800 - - expr: 
sum(increase(prometheus_target_scrapes_sample_duplicate_timestamp_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: duplicate_timestamp on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: B - step: 1800 - - expr: sum(increase(prometheus_target_scrapes_sample_out_of_bounds_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: out_of_bounds on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: C - step: 1800 - - expr: sum(increase(prometheus_target_scrapes_sample_out_of_order_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: out_of_order on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: D - step: 1800 - - expr: sum(increase(prometheus_rule_evaluation_failures_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: rule_evaluation_failure on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: G - step: 1800 - - expr: sum(increase(prometheus_tsdb_compactions_failed_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: tsdb_compactions_failed on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: K - step: 1800 - - expr: sum(increase(prometheus_tsdb_reloads_failures_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: tsdb_reloads_failures on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: L - step: 1800 - - expr: 
sum(increase(prometheus_tsdb_head_series_not_found{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: head_series_not_found on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: N - step: 1800 - - expr: sum(increase(prometheus_evaluator_iterations_missed_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: evaluator_iterations_missed on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: O - step: 1800 - - expr: sum(increase(prometheus_evaluator_iterations_skipped_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: evaluator_iterations_skipped on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: P - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Prometheus errors - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Main info - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - description: '' - editable: true - error: false - fill: 1 - grid: {} - id: 25 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: false - show: false - sort: max - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 
10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: prometheus_target_interval_length_seconds{instance="$instance",quantile="0.99"} - - 60 - format: time_series - interval: 2m - intervalFactor: 1 - legendFormat: "{{instance}}" - metric: '' - refId: A - step: 300 - thresholds: [] - timeFrom: - timeShift: - title: Scrape delay (counts with 1m scrape interval) - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - logBase: 1 - max: - min: - show: true - - format: short - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 14 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: Queue length - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_evaluator_duration_seconds{instance="$instance"}) by (instance, - quantile) - format: time_series - intervalFactor: 2 - legendFormat: Queue length - metric: prometheus_local_storage_indexing_queue_length - refId: B - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Rule evaulation duration - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: 
Scrape & rule duration - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 18 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(increase(http_requests_total{instance="$instance"}[$aggregation_interval])) - by (instance, handler) > 0 - format: time_series - intervalFactor: 2 - legendFormat: "{{ handler }} on {{ instance }}" - metric: '' - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Request count - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: none - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 16 - legend: - avg: false - current: false - hideEmpty: true - hideZero: true - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: 
max(sum(http_request_duration_microseconds{instance="$instance"}) by (instance, - handler, quantile)) by (instance, handler) > 0 - format: time_series - hide: false - intervalFactor: 2 - legendFormat: "{{ handler }} on {{ instance }}" - refId: B - thresholds: [] - timeFrom: - timeShift: - title: Request duration per handler - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: µs - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 19 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(increase(http_request_size_bytes{instance="$instance", quantile="0.99"}[$aggregation_interval])) - by (instance, handler) > 0 - format: time_series - hide: false - intervalFactor: 2 - legendFormat: "{{ handler }} in {{ instance }}" - refId: B - thresholds: [] - timeFrom: - timeShift: - title: Request size by handler - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Allocated bytes: "#F9BA8F" - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max 
count collector: "#bf1b00" - Max count harvester: "#bf1b00" - Max to persist: "#3F6833" - RSS: "#890F02" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 8 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/Max.*/" - fill: 0 - linewidth: 2 - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_engine_queries{instance="$instance"}) by (instance, handler) - format: time_series - intervalFactor: 2 - legendFormat: 'Current count ' - metric: last - refId: A - step: 1800 - - expr: sum(prometheus_engine_queries_concurrent_max{instance="$instance"}) by - (instance, handler) - format: time_series - intervalFactor: 2 - legendFormat: Max count - metric: last - refId: B - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Cont of concurent queries - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Requests & queries - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: - Alert queue capacity on o collector: "#bf1b00" - Alert queue capacity on o harvester: "#bf1b00" - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 20 - legend: - avg: false - current: false - max: false - min: false - show: false - 
total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/.*capacity.*/" - fill: 0 - linewidth: 2 - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_notifications_queue_capacity{instance="$instance"})by (instance) - format: time_series - intervalFactor: 2 - legendFormat: 'Alert queue capacity ' - metric: prometheus_local_storage_checkpoint_last_size_bytes - refId: A - step: 1800 - - expr: sum(prometheus_notifications_queue_length{instance="$instance"})by (instance) - format: time_series - intervalFactor: 2 - legendFormat: 'Alert queue size on ' - metric: prometheus_local_storage_checkpoint_last_size_bytes - refId: B - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Alert queue size - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 21 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_notifications_alertmanagers_discovered{instance="$instance"}) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: Checkpoint chunks written/s - metric: 
prometheus_local_storage_checkpoint_series_chunks_written_sum - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Count of discovered alertmanagers - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: none - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 39 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(increase(prometheus_notifications_dropped_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: notifications_dropped on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: F - step: 1800 - - expr: sum(increase(prometheus_rule_evaluation_failures_total{rule_type="alerting",instance="$instance"}[$aggregation_interval])) - by (rule_type,instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: rule_evaluation_failures on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Alerting errors - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: 
short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Alerting - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 45 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: increase(prometheus_target_sync_length_seconds_count{scrape_job="kubernetes-service-endpoints"}[$aggregation_interval]) - format: time_series - intervalFactor: 2 - legendFormat: Count of target synces - refId: A - step: 240 - thresholds: [] - timeFrom: - timeShift: - title: Kubernetes SD sync count - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 46 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: 
sum(increase(prometheus_target_scrapes_exceeded_sample_limit_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: exceeded_sample_limit on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: A - step: 1800 - - expr: sum(increase(prometheus_sd_file_read_errors_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: sd_file_read_error on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: E - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Service discovery errors - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Service discovery - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 36 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(increase(prometheus_tsdb_reloads_total{instance="$instance"}[30m])) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: "{{ instance }}" - refId: A - thresholds: [] - timeFrom: - timeShift: - title: Reloaded block from disk - tooltip: - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time 
- name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 5 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_tsdb_blocks_loaded{instance="$instance"}) by (instance) - format: time_series - intervalFactor: 2 - legendFormat: Loaded data blocks - metric: prometheus_local_storage_memory_chunkdescs - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Loaded data blocks - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 3 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: 
prometheus_tsdb_head_series{instance="$instance"} - format: time_series - intervalFactor: 2 - legendFormat: Time series count - metric: prometheus_local_storage_memory_series - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Time series total count - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 1 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(rate(prometheus_tsdb_head_samples_appended_total{instance="$instance"}[$aggregation_interval])) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: samples/s {{instance}} - metric: prometheus_local_storage_ingested_samples_total - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Samples Appended per second - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: '' - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: TSDB stats - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max 
to persist: "#3F6833" - To persist: "#9AC48A" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 2 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/Max.*/" - fill: 0 - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_tsdb_head_chunks{instance="$instance"}) by (instance) - format: time_series - hide: false - intervalFactor: 2 - legendFormat: Head chunk count - metric: prometheus_local_storage_memory_chunks - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Head chunks count - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 35 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: max(prometheus_tsdb_head_max_time{instance="$instance"}) by (instance) - - min(prometheus_tsdb_head_min_time{instance="$instance"}) by (instance) - format: time_series - intervalFactor: 2 - legendFormat: "{{ instance }}" - refId: A - thresholds: [] - timeFrom: - timeShift: - title: Length of head block - tooltip: - shared: true - sort: 0 - value_type: 
individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: ms - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 4 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(rate(prometheus_tsdb_head_chunks_created_total{instance="$instance"}[$aggregation_interval])) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: created on {{ instance }} - refId: B - - expr: sum(rate(prometheus_tsdb_head_chunks_removed_total{instance="$instance"}[$aggregation_interval])) - by (instance) * -1 - format: time_series - intervalFactor: 2 - legendFormat: deleted on {{ instance }} - refId: C - thresholds: [] - timeFrom: - timeShift: - title: Head Chunks Created/Deleted per second - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Head block stats - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 33 - legend: - avg: false - current: false - max: false - min: false - 
show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(increase(prometheus_tsdb_compaction_duration_sum{instance="$instance"}[30m]) - / increase(prometheus_tsdb_compaction_duration_count{instance="$instance"}[30m])) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: "{{ instance }}" - refId: B - thresholds: [] - timeFrom: - timeShift: - title: Compaction duration - tooltip: - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 34 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_tsdb_head_gc_duration_seconds{instance="$instance"}) by - (instance, quantile) - format: time_series - intervalFactor: 2 - legendFormat: "{{ quantile }} on {{ instance }}" - refId: A - thresholds: [] - timeFrom: - timeShift: - title: Go Garbage collection duration - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - 
dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 37 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_tsdb_wal_truncate_duration_seconds{instance="$instance"}) - by (instance, quantile) - format: time_series - intervalFactor: 2 - legendFormat: "{{ quantile }} on {{ instance }}" - refId: A - thresholds: [] - timeFrom: - timeShift: - title: WAL truncate duration seconds - tooltip: - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 38 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(tsdb_wal_fsync_duration_seconds{instance="$instance"}) by (instance, - quantile) - format: time_series - intervalFactor: 2 - legendFormat: "{{ quantile }} {{ instance }}" - refId: A - thresholds: [] - timeFrom: - timeShift: - title: WAL fsync duration seconds - tooltip: - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - 
show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Data maintenance - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: - Allocated bytes: "#7EB26D" - Allocated bytes - 1m max: "#BF1B00" - Allocated bytes - 1m min: "#BF1B00" - Allocated bytes - 5m max: "#BF1B00" - Allocated bytes - 5m min: "#BF1B00" - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - RSS: "#447EBC" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - decimals: - editable: true - error: false - fill: 1 - id: 6 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/-/" - fill: 0 - - alias: collector heap size - color: "#E0752D" - fill: 0 - linewidth: 2 - - alias: collector kubernetes memory limit - color: "#BF1B00" - fill: 0 - linewidth: 3 - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(process_resident_memory_bytes{instance="$instance"}) by (instance) - format: time_series - hide: false - intervalFactor: 2 - legendFormat: Total resident memory - {{instance}} - metric: process_resident_memory_bytes - refId: B - step: 1800 - - expr: sum(go_memstats_alloc_bytes{instance="$instance"}) by (instance) - format: time_series - hide: false - intervalFactor: 2 - legendFormat: Total llocated bytes - {{instance}} - metric: go_memstats_alloc_bytes - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Memory - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - 
min: - show: true - - aliasColors: - Allocated bytes: "#F9BA8F" - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - RSS: "#890F02" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 7 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: rate(go_memstats_alloc_bytes_total{instance="$instance"}[$aggregation_interval]) - format: time_series - intervalFactor: 2 - legendFormat: Allocated Bytes/s - metric: go_memstats_alloc_bytes - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Allocations per second - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - id: 9 - legend: - alignAsTable: false - avg: false - current: false - hideEmpty: false - max: false - min: false - rightSide: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(rate(process_cpu_seconds_total{instance="$instance"}[$aggregation_interval])) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: 
CPU/s - metric: prometheus_local_storage_ingested_samples_total - refId: B - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: CPU per second - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: - - avg - yaxes: - - format: none - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: RAM&CPU - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 47 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 12 - stack: false - steppedLine: false - targets: - - expr: sum(increase(net_conntrack_dialer_conn_failed_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - hide: false - interval: '' - intervalFactor: 2 - legendFormat: conntrack_dialer_conn_failed on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: M - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Net errors - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Contrac errors 
- titleSize: h6 - schemaVersion: 14 - style: dark - tags: - - prometheus - templating: - list: - - auto: true - auto_count: 30 - auto_min: 2m - current: - text: auto - value: "$__auto_interval" - hide: 0 - label: aggregation intarval - name: aggregation_interval - options: - - selected: true - text: auto - value: "$__auto_interval" - - selected: false - text: 1m - value: 1m - - selected: false - text: 10m - value: 10m - - selected: false - text: 30m - value: 30m - - selected: false - text: 1h - value: 1h - - selected: false - text: 6h - value: 6h - - selected: false - text: 12h - value: 12h - - selected: false - text: 1d - value: 1d - - selected: false - text: 7d - value: 7d - - selected: false - text: 14d - value: 14d - - selected: false - text: 30d - value: 30d - query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d - refresh: 2 - type: interval - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: Instance - multi: false - name: instance - options: [] - query: label_values(prometheus_build_info, instance) - refresh: 2 - regex: '' - sort: 2 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - current: - text: influxdb(heapster) - kokura - value: influxdb(heapster) - kokura - hide: 0 - label: InfluxDB datasource - name: influx_datasource - options: [] - query: influxdb - refresh: 1 - regex: '' - type: datasource - time: - from: now-7d - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: browser - title: Prometheus2.0 (v1.0.0 by FUSAKLA) - version: 8 + prometheus: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + 
"description": "Prometheus which you want to monitor", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "4.6.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + }, + { + "type": "panel", + "id": "text", + "name": "Text", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + }, + { + "datasource": "${DS_PROMETHEUS}", + "enable": true, + "expr": "count(sum(up{instance=\"$instance\"}) by (instance) < 1)", + "hide": false, + "iconColor": "rgb(250, 44, 18)", + "limit": 100, + "name": "downage", + "showIn": 0, + "step": "30s", + "tagKeys": "instance", + "textFormat": "prometheus down", + "titleFormat": "Downage", + "type": "alert" + }, + { + "datasource": "${DS_PROMETHEUS}", + "enable": true, + "expr": "sum(changes(prometheus_config_last_reload_success_timestamp_seconds[10m])) by (instance)", + "hide": false, + "iconColor": "#fceaca", + "limit": 100, + "name": "Reload", + "showIn": 0, + "step": "5m", + "tagKeys": "instance", + "tags": [], + "titleFormat": "Reload", + "type": "tags" + } + ] + }, + "description": "Dashboard for monitoring of Prometheus v2.x.x", + "overwrite": true, + "editable": false, + "gnetId": 3681, + "graphTooltip": 1, + "id": 41, + "links": [ + { + "icon": "info", + "tags": [], + "targetBlank": true, + "title": "Dashboard's Github ", + "tooltip": "Github repo of this dashboard", + "type": "link", + "url": "https://github.com/FUSAKLA/Prometheus2-grafana-dashboard" + }, + { + "icon": "doc", + "tags": [], + 
"targetBlank": true, + "title": "Prometheus Docs", + "tooltip": "", + "type": "link", + "url": "http://prometheus.io/docs/introduction/overview/" + } + ], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 53, + "panels": [], + "repeat": null, + "title": "Header instance info", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#bf1b00" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 1, + "format": "s", + "gauge": { + "maxValue": 1000000, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 41, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "time() - process_start_time_seconds{instance=\"$instance\"}", + "format": "time_series", + "instant": false, + "intervalFactor": 2, + "refId": "A" + } + ], + "thresholds": "", + "title": "Uptime", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#bf1b00" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "short", + "gauge": { + "maxValue": 
1000000, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 8, + "x": 4, + "y": 1 + }, + "id": 42, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "prometheus_tsdb_head_series{instance=\"$instance\"}", + "format": "time_series", + "instant": false, + "intervalFactor": 2, + "refId": "A" + } + ], + "thresholds": "500000,800000,1000000", + "title": "Total count of time series", + "type": "singlestat", + "valueFontSize": "150%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 4, + "x": 12, + "y": 1 + }, + "id": 48, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": 
"N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "version", + "targets": [ + { + "expr": "prometheus_build_info{instance=\"$instance\"}", + "format": "table", + "instant": true, + "intervalFactor": 2, + "refId": "A" + } + ], + "thresholds": "", + "title": "Version", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "format": "ms", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 4, + "x": 16, + "y": 1 + }, + "id": 49, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "prometheus_tsdb_head_max_time{instance=\"$instance\"} - prometheus_tsdb_head_min_time{instance=\"$instance\"}", + "format": "time_series", + "instant": true, + "intervalFactor": 2, + "refId": "A" + } + ], + "thresholds": "", + "title": "Actual head block length", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + 
"valueName": "current" + }, + { + "content": "", + "gridPos": { + "h": 5, + "w": 2, + "x": 20, + "y": 1 + }, + "height": "", + "id": 50, + "links": [], + "mode": "html", + "options": {}, + "title": "", + "transparent": true, + "type": "text" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "#e6522c", + "rgba(237, 129, 40, 0.89)", + "#299c46" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 1, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 2, + "x": 22, + "y": 1 + }, + "id": 52, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "2", + "format": "time_series", + "intervalFactor": 2, + "refId": "A" + } + ], + "thresholds": "10,20", + "title": "", + "transparent": true, + "type": "singlestat", + "valueFontSize": "200%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 6 + }, + "id": 54, + "panels": [], + "repeat": null, + "title": "Main info", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 7 + }, + 
"id": 15, + "legend": { + "avg": true, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "max(prometheus_engine_query_duration_seconds{instance=\"$instance\"}) by (instance, slice)", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "max duration for {{slice}}", + "metric": "prometheus_local_storage_rushed_mode", + "refId": "A", + "step": 900 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Query elapsed time", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": "", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 7 + }, + "id": 17, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": 
false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(increase(prometheus_tsdb_head_series_created_total{instance=\"$instance\"}[$aggregation_interval])) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "created on {{ instance }}", + "metric": "prometheus_local_storage_maintain_series_duration_seconds_count", + "refId": "A", + "step": 1800 + }, + { + "expr": "sum(increase(prometheus_tsdb_head_series_removed_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) * -1", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "removed on {{ instance }}", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Head series created/deleted", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 7 + }, + "id": 13, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + 
"pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(increase(prometheus_target_scrapes_exceeded_sample_limit_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "exceeded_sample_limit on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "A", + "step": 1800 + }, + { + "expr": "sum(increase(prometheus_target_scrapes_sample_duplicate_timestamp_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "duplicate_timestamp on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "B", + "step": 1800 + }, + { + "expr": "sum(increase(prometheus_target_scrapes_sample_out_of_bounds_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "out_of_bounds on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "C", + "step": 1800 + }, + { + "expr": "sum(increase(prometheus_target_scrapes_sample_out_of_order_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "out_of_order on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "D", + "step": 1800 + }, + { + "expr": "sum(increase(prometheus_rule_evaluation_failures_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "rule_evaluation_failure on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "G", + "step": 1800 + }, + { 
+ "expr": "sum(increase(prometheus_tsdb_compactions_failed_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "tsdb_compactions_failed on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "K", + "step": 1800 + }, + { + "expr": "sum(increase(prometheus_tsdb_reloads_failures_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "tsdb_reloads_failures on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "L", + "step": 1800 + }, + { + "expr": "sum(increase(prometheus_tsdb_head_series_not_found{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "head_series_not_found on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "E", + "step": 1800 + }, + { + "expr": "sum(increase(prometheus_evaluator_iterations_missed_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "evaluator_iterations_missed on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "O", + "step": 1800 + }, + { + "expr": "sum(increase(prometheus_evaluator_iterations_skipped_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "evaluator_iterations_skipped on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "P", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Prometheus errors", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, 
+ "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 14 + }, + "id": 55, + "panels": [], + "repeat": null, + "title": "Scrape & rule duration", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "description": "", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 15 + }, + "id": 25, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": false, + "show": false, + "sort": "max", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "prometheus_target_interval_length_seconds{instance=\"$instance\",quantile=\"0.99\"} - 60", + "format": "time_series", + "interval": "2m", + "intervalFactor": 1, + "legendFormat": "{{instance}}", + "metric": "", + "refId": "A", + "step": 300 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Scrape delay (counts with 1m scrape interval)", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + 
"show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 15 + }, + "id": 14, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "Queue length", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_evaluator_duration_seconds{instance=\"$instance\"}) by (instance, quantile)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Queue length", + "metric": "prometheus_local_storage_indexing_queue_length", + "refId": "B", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Rule evaulation duration", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + } + ], + "yaxis": 
{ + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 22 + }, + "id": 56, + "panels": [], + "repeat": null, + "title": "Requests & queries", + "type": "row" + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 0, + "y": 23 + }, + "id": 18, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(increase(http_requests_total{instance=\"$instance\"}[$aggregation_interval])) by (instance, handler) > 0", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ handler }} on {{ instance }}", + "metric": "", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Request count", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": 
"#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 6, + "y": 23 + }, + "id": 16, + "legend": { + "avg": false, + "current": false, + "hideEmpty": true, + "hideZero": true, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "max(sum(http_request_duration_microseconds{instance=\"$instance\"}) by (instance, handler, quantile)) by (instance, handler) > 0", + "format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "{{ handler }} on {{ instance }}", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Request duration per handler", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "µs", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 
6, + "x": 12, + "y": 23 + }, + "id": 19, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(increase(http_request_size_bytes{instance=\"$instance\", quantile=\"0.99\"}[$aggregation_interval])) by (instance, handler) > 0", + "format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "{{ handler }} in {{ instance }}", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Request size by handler", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Allocated bytes": "#F9BA8F", + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max count collector": "#bf1b00", + "Max count harvester": "#bf1b00", + "Max to persist": "#3F6833", + "RSS": "#890F02" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 23 + }, + "id": 8, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + 
"values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/Max.*/", + "fill": 0, + "linewidth": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_engine_queries{instance=\"$instance\"}) by (instance, handler)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Current count ", + "metric": "last", + "refId": "A", + "step": 1800 + }, + { + "expr": "sum(prometheus_engine_queries_concurrent_max{instance=\"$instance\"}) by (instance, handler)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Max count", + "metric": "last", + "refId": "B", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cont of concurent queries", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 30 + }, + "id": 57, + "panels": [], + "repeat": null, + "title": "Alerting", + "type": "row" + }, + { + "aliasColors": { + "Alert queue capacity on o collector": "#bf1b00", + "Alert queue capacity on o harvester": "#bf1b00", + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": 
"${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 31 + }, + "id": 20, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/.*capacity.*/", + "fill": 0, + "linewidth": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_notifications_queue_capacity{instance=\"$instance\"})by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Alert queue capacity ", + "metric": "prometheus_local_storage_checkpoint_last_size_bytes", + "refId": "A", + "step": 1800 + }, + { + "expr": "sum(prometheus_notifications_queue_length{instance=\"$instance\"})by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Alert queue size on ", + "metric": "prometheus_local_storage_checkpoint_last_size_bytes", + "refId": "B", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Alert queue size", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, 
+ "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 31 + }, + "id": 21, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_notifications_alertmanagers_discovered{instance=\"$instance\"}) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Checkpoint chunks written/s", + "metric": "prometheus_local_storage_checkpoint_series_chunks_written_sum", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Count of discovered alertmanagers", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 31 + }, + "id": 39, + "legend": { + "avg": false, + 
"current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(increase(prometheus_notifications_dropped_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "notifications_dropped on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "F", + "step": 1800 + }, + { + "expr": "sum(increase(prometheus_rule_evaluation_failures_total{rule_type=\"alerting\",instance=\"$instance\"}[$aggregation_interval])) by (rule_type,instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "rule_evaluation_failures on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Alerting errors", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 38 + }, + "id": 58, + "panels": [], + "repeat": null, + "title": "Service discovery", + "type": "row" + }, + { + "aliasColors": {}, + "bars": 
false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 0, + "y": 39 + }, + "id": 45, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "increase(prometheus_target_sync_length_seconds_count{scrape_job=\"kubernetes-service-endpoints\"}[$aggregation_interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Count of target synces", + "refId": "A", + "step": 240 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Kubernetes SD sync count", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 6, + "y": 39 + }, + "id": 46, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + 
"percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(increase(prometheus_target_scrapes_exceeded_sample_limit_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "exceeded_sample_limit on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "A", + "step": 1800 + }, + { + "expr": "sum(increase(prometheus_sd_file_read_errors_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "sd_file_read_error on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "E", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Service discovery errors", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 46 + }, + "id": 59, + "panels": [], + "repeat": null, + "title": "TSDB stats", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 0, + "y": 47 + }, + "id": 36, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + 
"lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(increase(prometheus_tsdb_reloads_total{instance=\"$instance\"}[30m])) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ instance }}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Reloaded block from disk", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 6, + "y": 47 + }, + "id": 5, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_tsdb_blocks_loaded{instance=\"$instance\"}) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Loaded data blocks", + 
"metric": "prometheus_local_storage_memory_chunkdescs", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Loaded data blocks", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 12, + "y": 47 + }, + "id": 3, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "prometheus_tsdb_head_series{instance=\"$instance\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Time series count", + "metric": "prometheus_local_storage_memory_series", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Time series total count", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": 
[] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 47 + }, + "id": 1, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(prometheus_tsdb_head_samples_appended_total{instance=\"$instance\"}[$aggregation_interval])) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "samples/s {{instance}}", + "metric": "prometheus_local_storage_ingested_samples_total", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Samples Appended per second", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 54 + }, + "id": 60, + "panels": [], + "repeat": null, + "title": "Head block stats", + "type": "row" + }, + { + 
"aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833", + "To persist": "#9AC48A" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 55 + }, + "id": 2, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/Max.*/", + "fill": 0 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_tsdb_head_chunks{instance=\"$instance\"}) by (instance)", + "format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "Head chunk count", + "metric": "prometheus_local_storage_memory_chunks", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Head chunks count", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 55 + }, + "id": 35, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": 
false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "max(prometheus_tsdb_head_max_time{instance=\"$instance\"}) by (instance) - min(prometheus_tsdb_head_min_time{instance=\"$instance\"}) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ instance }}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Length of head block", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "ms", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 55 + }, + "id": 4, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": 
"sum(rate(prometheus_tsdb_head_chunks_created_total{instance=\"$instance\"}[$aggregation_interval])) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "created on {{ instance }}", + "refId": "B" + }, + { + "expr": "sum(rate(prometheus_tsdb_head_chunks_removed_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) * -1", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "deleted on {{ instance }}", + "refId": "C" + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Head Chunks Created/Deleted per second", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 62 + }, + "id": 61, + "panels": [], + "repeat": null, + "title": "Data maintenance", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 0, + "y": 63 + }, + "id": 33, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(increase(prometheus_tsdb_compaction_duration_sum{instance=\"$instance\"}[30m]) / 
increase(prometheus_tsdb_compaction_duration_count{instance=\"$instance\"}[30m])) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ instance }}", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Compaction duration", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 6, + "y": 63 + }, + "id": 34, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_tsdb_head_gc_duration_seconds{instance=\"$instance\"}) by (instance, quantile)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ quantile }} on {{ instance }}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Go Garbage collection duration", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": null, + "logBase": 1, + "max": null, + 
"min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 12, + "y": 63 + }, + "id": 37, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_tsdb_wal_truncate_duration_seconds{instance=\"$instance\"}) by (instance, quantile)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ quantile }} on {{ instance }}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "WAL truncate duration seconds", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 63 + }, + "id": 38, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + 
"options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(tsdb_wal_fsync_duration_seconds{instance=\"$instance\"}) by (instance, quantile)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ quantile }} {{ instance }}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "WAL fsync duration seconds", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 70 + }, + "id": 62, + "panels": [], + "repeat": null, + "title": "RAM&CPU", + "type": "row" + }, + { + "aliasColors": { + "Allocated bytes": "#7EB26D", + "Allocated bytes - 1m max": "#BF1B00", + "Allocated bytes - 1m min": "#BF1B00", + "Allocated bytes - 5m max": "#BF1B00", + "Allocated bytes - 5m min": "#BF1B00", + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833", + "RSS": "#447EBC" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": null, + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 71 + }, + "id": 6, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + 
"pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/-/", + "fill": 0 + }, + { + "alias": "collector heap size", + "color": "#E0752D", + "fill": 0, + "linewidth": 2 + }, + { + "alias": "collector kubernetes memory limit", + "color": "#BF1B00", + "fill": 0, + "linewidth": 3 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(process_resident_memory_bytes{instance=\"$instance\"}) by (instance)", + "format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "Total resident memory - {{instance}}", + "metric": "process_resident_memory_bytes", + "refId": "B", + "step": 1800 + }, + { + "expr": "sum(go_memstats_alloc_bytes{instance=\"$instance\"}) by (instance)", + "format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "Total llocated bytes - {{instance}}", + "metric": "go_memstats_alloc_bytes", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Memory", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": { + "Allocated bytes": "#F9BA8F", + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833", + "RSS": "#890F02" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 71 + }, + "id": 7, + "legend": { + "avg": false, + "current": false, + 
"max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(go_memstats_alloc_bytes_total{instance=\"$instance\"}[$aggregation_interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Allocated Bytes/s", + "metric": "go_memstats_alloc_bytes", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Allocations per second", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 71 + }, + "id": 9, + "legend": { + "alignAsTable": false, + "avg": false, + "current": false, + "hideEmpty": false, + "max": false, + "min": false, + "rightSide": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": 
"sum(rate(process_cpu_seconds_total{instance=\"$instance\"}[$aggregation_interval])) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "CPU/s", + "metric": "prometheus_local_storage_ingested_samples_total", + "refId": "B", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "CPU per second", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [ + "avg" + ] + }, + "yaxes": [ + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 78 + }, + "id": 63, + "panels": [], + "repeat": null, + "title": "Contrac errors", + "type": "row" + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 79 + }, + "id": 47, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(increase(net_conntrack_dialer_conn_failed_total{instance=\"$instance\"}[$aggregation_interval])) by (instance) > 0", + "format": "time_series", + "hide": false, + "interval": 
"", + "intervalFactor": 2, + "legendFormat": "conntrack_dialer_conn_failed on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "M", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Net errors", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ] + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "prometheus" + ], + "templating": { + "list": [ + { + "auto": true, + "auto_count": 30, + "auto_min": "2m", + "current": { + "text": "auto", + "value": "$__auto_interval_aggregation_interval" + }, + "hide": 0, + "label": "aggregation interval", + "name": "aggregation_interval", + "options": [ + { + "selected": true, + "text": "auto", + "value": "$__auto_interval_aggregation_interval" + }, + { + "selected": false, + "text": "1m", + "value": "1m" + }, + { + "selected": false, + "text": "10m", + "value": "10m" + }, + { + "selected": false, + "text": "30m", + "value": "30m" + }, + { + "selected": false, + "text": "1h", + "value": "1h" + }, + { + "selected": false, + "text": "6h", + "value": "6h" + }, + { + "selected": false, + "text": "12h", + "value": "12h" + }, + { + "selected": false, + "text": "1d", + "value": "1d" + }, + { + "selected": false, + "text": "7d", + "value": "7d" + }, + { + "selected": false, + "text": "14d", + "value": "14d" + }, + { + "selected": false, + "text": "30d", + "value": "30d" + } + ], + "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d", + "refresh": 2, + "skipUrlSync": false, + "type": "interval" + }, + { + "allValue": null, + "current": {}, 
+ "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "Instance", + "multi": false, + "name": "instance", + "options": [], + "query": "label_values(prometheus_build_info, instance)", + "refresh": 2, + "regex": "", + "skipUrlSync": false, + "sort": 2, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "current": { + "text": "No data sources found", + "value": "" + }, + "hide": 0, + "includeAll": false, + "label": "InfluxDB datasource", + "multi": false, + "name": "influx_datasource", + "options": [], + "query": "influxdb", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "Prometheus2.0 (v1.0.0 by FUSAKLA)", + "version": 1 + } \ No newline at end of file diff --git a/tools/deployment/osh-infra-monitoring/110-grafana.sh b/tools/deployment/osh-infra-monitoring/110-grafana.sh index 8e91458b0..9675f573a 100755 --- a/tools/deployment/osh-infra-monitoring/110-grafana.sh +++ b/tools/deployment/osh-infra-monitoring/110-grafana.sh @@ -19,7 +19,7 @@ set -xe #NOTE: Lint and package chart make grafana -FEATURE_GATES="calico,ceph,containers,coredns,elasticsearch,kubernetes,nginx,nodes,openstack,prometheus,home_dashboard,apparmor" 
+FEATURE_GATES="calico,ceph,containers,coredns,elasticsearch,kubernetes,nginx,nodes,openstack,prometheus,home_dashboard,persistentvolume,apparmor" : ${OSH_INFRA_EXTRA_HELM_ARGS_GRAFANA:="$({ ./tools/deployment/common/get-values-overrides.sh grafana;} 2> /dev/null)"} #NOTE: Deploy command