diff --git a/doc/source/conf.py b/doc/source/conf.py
index a30be6875..cb4d2f6cd 100644
--- a/doc/source/conf.py
+++ b/doc/source/conf.py
@@ -68,7 +68,7 @@ release = u'0.1.0'
#
# This is also used if you do content translation via gettext catalogs.
# Usually you set "language" from the command line for these cases.
-language = None
+language = 'en'
# List of patterns, relative to source directory, that match files and
# directories to ignore when looking for source files.
diff --git a/global/schemas/pegleg/AccountCatalogue/v1.yaml b/global/schemas/pegleg/AccountCatalogue/v1.yaml
index 681aed425..b7dacafc8 100644
--- a/global/schemas/pegleg/AccountCatalogue/v1.yaml
+++ b/global/schemas/pegleg/AccountCatalogue/v1.yaml
@@ -631,6 +631,11 @@ data:
properties:
username:
type: string
+ placement:
+ type: object
+ properties:
+ username:
+ type: string
oslo_db:
type: object
properties:
@@ -652,6 +657,44 @@ data:
type: string
database:
type: string
+ placement:
+ type: object
+ properties:
+ placement:
+ type: object
+ properties:
+ role:
+ type: string
+ region_name:
+ type: string
+ username:
+ type: string
+ project_name:
+ type: string
+ user_domain_name:
+ type: string
+ project_domain_name:
+ type: string
+ oslo_messaging:
+ type: object
+ properties:
+ admin:
+ type: object
+ properties:
+ username:
+ type: string
+ placement:
+ type: object
+ properties:
+ username:
+ type: string
+ oslo_db:
+ type: object
+ properties:
+ username:
+ type: string
+ database:
+ type: string
horizon:
type: object
properties:
diff --git a/global/software/charts/osh-infra/osh-infra-dashboards/grafana.yaml b/global/software/charts/osh-infra/osh-infra-dashboards/grafana.yaml
index 3961986ad..2c2dce691 100644
--- a/global/software/charts/osh-infra/osh-infra-dashboards/grafana.yaml
+++ b/global/software/charts/osh-infra/osh-infra-dashboards/grafana.yaml
@@ -305,17454 +305,40363 @@ data:
group_dn = "*"
org_role = "Viewer"
dashboards:
- calico:
- __inputs:
- - name: prometheus
- label: Prometheus
- description: ''
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: grafana
- id: grafana
- name: Grafana
- version: 5.0.0
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- annotations:
- list:
- - builtIn: 1
- datasource: "-- Grafana --"
- enable: true
- hide: true
- iconColor: rgba(0, 211, 255, 1)
- name: Annotations & Alerts
- type: dashboard
- description: Calico cluster monitoring dashboard
- editable: false
- gnetId: 3244
- graphTooltip: 0
- id:
- links: []
- panels:
- - collapsed: false
- gridPos:
- h: 1
- w: 24
- x: 0
- 'y': 0
- id: 15
- panels: []
- repeat:
- title: Felix
- type: row
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 0
- 'y': 1
- id: 1
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_active_local_endpoints
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Active Local Endpoints
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 12
- 'y': 1
- id: 3
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_active_local_policies
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Active Local Policies
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 0
- 'y': 8
- id: 2
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_active_local_selectors
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Active Local Selectors
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 12
- 'y': 8
- id: 4
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_active_local_tags
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Active Local Tags
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 0
- 'y': 15
- id: 5
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_cluster_num_host_endpoints
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Cluster Host Endpoints
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 12
- 'y': 15
- id: 6
- legend:
- alignAsTable: true
- avg: false
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_cluster_num_workload_endpoints
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Cluster Workload Endpoints
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 0
- 'y': 22
- id: 7
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_cluster_num_hosts
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Clusters Hosts
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 12
- 'y': 22
- id: 8
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_ipsets_calico
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Active IP Sets
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 0
- 'y': 29
- id: 9
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_iptables_chains
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Active IP Tables Chains
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 12
- 'y': 29
- id: 10
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_ipset_errors
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: IP Set Command Failures
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 0
- 'y': 36
- id: 11
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_iptables_save_errors
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: IP Tables Save Errors
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 12
- 'y': 36
- id: 12
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_iptables_restore_errors
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: IP Tables Restore Errors
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 0
- 'y': 43
- id: 13
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_resyncs_started
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Felix Resyncing Datastore
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- gridPos:
- h: 7
- w: 12
- x: 12
- 'y': 43
- id: 14
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - expr: felix_int_dataplane_failures
- format: time_series
- intervalFactor: 2
- legendFormat: "{{instance}}"
- refId: A
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Dataplane failed updates
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- refresh: 5m
- schemaVersion: 16
- style: dark
- tags:
- - calico
- templating:
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- time:
- from: now-1h
- to: now
- timepicker:
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- timezone: utc
- title: Kubernetes Calico
- version: 2
- ceph_cluster:
- __inputs:
- - name: DS_PROMETHEUS
- label: Prometheus
- description: Prometheus.IO
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: panel
- id: singlestat
- name: Singlestat
- version: ''
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: grafana
- id: grafana
- name: Grafana
- version: 3.1.1
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- id:
- title: Ceph - Cluster
- tags:
- - ceph
- - cluster
- style: dark
- timezone: browser
- editable: true
- hideControls: false
- sharedCrosshair: false
- rows:
- - collapse: false
- editable: true
- height: 150px
- panels:
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 21
- interval: 1m
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: ceph_health_status{application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- refId: A
- step: 60
- thresholds: '1,1'
- title: Status
- transparent: false
- type: singlestat
- valueFontSize: 100%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- - op: "="
- text: HEALTHY
- value: '0'
- - op: "="
- text: WARNING
- value: '1'
- - op: "="
- text: CRITICAL
- value: '2'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 22
- interval: 1m
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: true
- lineColor: rgb(31, 120, 193)
- show: true
- targets:
- - expr: count(ceph_pool_max_avail{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: ''
- refId: A
- step: 60
- thresholds: ''
- title: Pools
- transparent: false
- type: singlestat
- valueFontSize: 100%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: bytes
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 33
- interval: 1m
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: true
- lineColor: rgb(31, 120, 193)
- show: true
- targets:
- - expr: ceph_cluster_total_bytes{application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: ''
- refId: A
- step: 60
- thresholds: 0.025,0.1
- title: Cluster Capacity
- transparent: false
- type: singlestat
- valueFontSize: 100%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: bytes
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 34
- interval: 1m
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: true
- lineColor: rgb(31, 120, 193)
- show: true
- targets:
- - expr: ceph_cluster_total_used_bytes{application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: ''
- refId: A
- step: 60
- thresholds: 0.025,0.1
- title: Used Capacity
- transparent: false
- type: singlestat
- valueFontSize: 100%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: percentunit
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 23
- interval: 1m
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: true
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: ceph_cluster_total_used_bytes/ceph_cluster_total_bytes{application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: ''
- refId: A
- step: 60
- thresholds: '70,80'
- title: Current Utilization
- transparent: false
- type: singlestat
- valueFontSize: 100%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- title: New row
- - collapse: false
- editable: true
- height: 100px
- panels:
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 26
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum(ceph_osd_in{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: ''
- refId: A
- step: 60
- thresholds: ''
- title: OSDs IN
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 40, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 27
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum(ceph_osd_metadata{application="ceph",release_group="$ceph_cluster"}) - sum(ceph_osd_in{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: ''
- refId: A
- step: 60
- thresholds: '1,1'
- title: OSDs OUT
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 28
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum(ceph_osd_up{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: ''
- refId: A
- step: 60
- thresholds: ''
- title: OSDs UP
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 40, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 29
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum(ceph_osd_metadata{application="ceph",release_group="$ceph_cluster"}) - sum(ceph_osd_up{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: ''
- refId: A
- step: 60
- thresholds: '1,1'
- title: OSDs DOWN
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 30
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: true
- lineColor: rgb(31, 120, 193)
- show: true
- targets:
- - expr: avg(ceph_osd_numpg{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: ''
- refId: A
- step: 60
- thresholds: '250,300'
- title: Average PGs per OSD
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- title: New row
- - collapse: false
- editable: true
- height: 250px
- panels:
- - aliasColors:
- Available: "#EAB839"
- Total Capacity: "#447EBC"
- Used: "#BF1B00"
- total_avail: "#6ED0E0"
- total_space: "#7EB26D"
- total_used: "#890F02"
- bars: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 4
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- height: '300'
- id: 1
- interval: "$interval"
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 0
- links: []
- minSpan:
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: Total Capacity
- fill: 0
- linewidth: 3
- stack: false
- span: 4
- stack: true
- steppedLine: false
- targets:
- - expr: ceph_cluster_total_bytes{application="ceph",release_group="$ceph_cluster"} - ceph_cluster_total_used_bytes{application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Available
- refId: A
- step: 60
- - expr: ceph_cluster_total_used_bytes
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Used
- refId: B
- step: 60
- - expr: ceph_cluster_total_bytes
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Total Capacity
- refId: C
- step: 60
- timeFrom:
- timeShift:
- title: Capacity
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Total Capacity: "#7EB26D"
- Used: "#BF1B00"
- total_avail: "#6ED0E0"
- total_space: "#7EB26D"
- total_used: "#890F02"
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 0
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- thresholdLine: false
- height: '300'
- id: 3
- interval: "$interval"
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- minSpan:
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 4
- stack: true
- steppedLine: false
- targets:
- - expr: sum(ceph_osd_op_w{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Write
- refId: A
- step: 60
- - expr: sum(ceph_osd_op_r{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Read
- refId: B
- step: 60
- timeFrom:
- timeShift:
- title: IOPS
- tooltip:
- msResolution: true
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: none
- label: ''
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- height: '300'
- id: 7
- interval: "$interval"
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 4
- stack: true
- steppedLine: false
- targets:
- - expr: sum(ceph_osd_op_in_bytes{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Write
- refId: A
- step: 60
- - expr: sum(ceph_osd_op_out_bytes{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Read
- refId: B
- step: 60
- timeFrom:
- timeShift:
- title: Throughput
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: Bps
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min: 0
- show: true
- repeat:
- showTitle: true
- title: CLUSTER
- - collapse: false
- editable: true
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 18
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: false
- min: false
- rightSide: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: "/^Total.*$/"
- stack: false
- span: 12
- stack: true
- steppedLine: false
- targets:
- - expr: ceph_cluster_total_objects{application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Total
- refId: A
- step: 60
- timeFrom:
- timeShift:
- title: Objects in the Cluster
- tooltip:
- msResolution: false
- shared: true
- sort: 1
- value_type: individual
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 19
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: false
- min: false
- rightSide: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: "/^Total.*$/"
- stack: false
- span: 6
- stack: true
- steppedLine: false
- targets:
- - expr: sum(ceph_osd_numpg{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Total
- refId: A
- step: 60
- - expr: sum(ceph_pg_active{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Active
- refId: B
- step: 60
- - expr: sum(ceph_pg_inconsistent{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Inconsistent
- refId: C
- step: 60
- - expr: sum(ceph_pg_creating{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Creating
- refId: D
- step: 60
- - expr: sum(ceph_pg_recovering{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Recovering
- refId: E
- step: 60
- - expr: sum(ceph_pg_down{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Down
- refId: F
- step: 60
- timeFrom:
- timeShift:
- title: PGs
- tooltip:
- msResolution: false
- shared: true
- sort: 1
- value_type: individual
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 20
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: false
- min: false
- rightSide: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: "/^Total.*$/"
- stack: false
- span: 6
- stack: true
- steppedLine: false
- targets:
- - expr: sum(ceph_pg_degraded{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Degraded
- refId: A
- step: 60
- - expr: sum(ceph_pg_stale{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Stale
- refId: B
- step: 60
- - expr: sum(ceph_pg_undersized{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Undersized
- refId: C
- step: 60
- timeFrom:
- timeShift:
- title: Stuck PGs
- tooltip:
- msResolution: false
- shared: true
- sort: 1
- value_type: individual
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- title: New row
- time:
- from: now-1h
- to: now
- timepicker:
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- templating:
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- - current: {}
- hide: 0
- label: Cluster
- name: ceph_cluster
- options: []
- type: query
- query: label_values(ceph_health_status, release_group)
- refresh: 1
- sort: 2
- datasource: "${DS_PROMETHEUS}"
- - auto: true
- auto_count: 10
- auto_min: 1m
- current:
- tags: []
- text: 1m
- value: 1m
- datasource:
- hide: 0
- includeAll: false
- label: Interval
- multi: false
- name: interval
- options:
- - selected: false
- text: auto
- value: "$__auto_interval"
- - selected: true
- text: 1m
- value: 1m
- - selected: false
- text: 10m
- value: 10m
- - selected: false
- text: 30m
- value: 30m
- - selected: false
- text: 1h
- value: 1h
- - selected: false
- text: 6h
- value: 6h
- - selected: false
- text: 12h
- value: 12h
- - selected: false
- text: 1d
- value: 1d
- - selected: false
- text: 7d
- value: 7d
- - selected: false
- text: 14d
- value: 14d
- - selected: false
- text: 30d
- value: 30d
- query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d
- refresh: 0
- type: interval
- annotations:
- list: []
- refresh: 5m
- schemaVersion: 12
- version: 26
- links: []
- gnetId: 917
- description: "Ceph Cluster overview.\r\n"
- ceph_osd:
- __inputs:
- - name: DS_PROMETHEUS
- label: Prometheus
- description: Prometheus.IO
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: panel
- id: singlestat
- name: Singlestat
- version: ''
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: grafana
- id: grafana
- name: Grafana
- version: 3.1.1
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- id:
- title: Ceph - OSD
- tags:
- - ceph
- - osd
- style: dark
- timezone: browser
- editable: true
- hideControls: false
- sharedCrosshair: false
- rows:
- - collapse: false
- editable: true
- height: 100px
- panels:
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 40, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 6
- interval:
- isNew: true
- links: []
- mappingType: 2
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- - from: '0'
- text: DOWN
- to: '0.99'
- - from: '0.99'
- text: UP
- to: '1'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: ceph_osd_up{ceph_daemon="$osd",application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- refId: A
- step: 60
- thresholds: '0,1'
- timeFrom:
- title: Status
- transparent: false
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: DOWN
- value: '0'
- - op: "="
- text: UP
- value: '1'
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 40, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 8
- interval:
- isNew: true
- links: []
- mappingType: 2
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- - from: '0'
- text: OUT
- to: '0.99'
- - from: '0.99'
- text: IN
- to: '1'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: ceph_osd_in{ceph_daemon="$osd",application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- refId: A
- step: 60
- thresholds: '0,1'
- timeFrom:
- title: Available
- transparent: false
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: DOWN
- value: '0'
- - op: "="
- text: UP
- value: '1'
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 10
- interval:
- isNew: true
- links: []
- mappingType: 2
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: count(ceph_osd_metadata{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- refId: A
- step: 60
- thresholds: '0,1'
- timeFrom:
- title: Total OSDs
- transparent: false
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: DOWN
- value: '0'
- - op: "="
- text: UP
- value: '1'
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- title: New row
- - collapse: false
- editable: true
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 1
- grid:
- threshold1: 250
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2: 300
- threshold2Color: rgba(234, 112, 112, 0.22)
- thresholdLine: true
- id: 5
- interval: "$interval"
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: "/^Average.*/"
- fill: 0
- stack: false
- span: 10
- stack: true
- steppedLine: false
- targets:
- - expr: ceph_osd_numpg{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Number of PGs - {{ $osd }}
- refId: A
- step: 60
- - expr: avg(ceph_osd_numpg{application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Average Number of PGs in the Cluster
- refId: B
- step: 60
- timeFrom:
- timeShift:
- title: PGs
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 7
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: true
- targets:
- - expr: (ceph_osd_stat_bytes_used{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"}/ceph_osd_stat_bytes{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"})*100
- interval: "$interval"
- intervalFactor: 1
- legendFormat: ''
- refId: A
- step: 60
- thresholds: '60,80'
- timeFrom:
- title: Utilization
- transparent: false
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- showTitle: true
- title: 'OSD: $osd'
- - collapse: false
- editable: true
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 2
- interval: "$interval"
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 6
- stack: true
- steppedLine: false
- targets:
- - expr: ceph_osd_stat_bytes_used{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Used - {{ osd.$osd }}
- metric: ceph_osd_used_bytes
- refId: A
- step: 60
- - expr: ceph_osd_stat_bytes{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"} - ceph_osd_stat_bytes_used{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"}
- hide: false
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Available - {{ $osd }}
- metric: ceph_osd_avail_bytes
- refId: B
- step: 60
- timeFrom:
- timeShift:
- title: OSD Storage
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 5
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 9
- interval: "$interval"
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: false
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 2
- points: true
- renderer: flot
- seriesOverrides: []
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: (ceph_osd_stat_bytes_used{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"}/ceph_osd_stat_bytes{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Available - {{ $osd }}
- metric: ceph_osd_avail_bytes
- refId: A
- step: 60
- timeFrom:
- timeShift:
- title: Utilization Variance
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: none
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: none
- label:
- logBase: 1
- max:
- min:
- show: true
- time:
- from: now-1h
- to: now
- timepicker:
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- templating:
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- - current: {}
- hide: 0
- label: Cluster
- name: ceph_cluster
- options: []
- type: query
- query: label_values(ceph_health_status, release_group)
- refresh: 1
- sort: 2
- datasource: "${DS_PROMETHEUS}"
- - auto: true
- auto_count: 10
- auto_min: 1m
- current:
- selected: true
- text: 1m
- value: 1m
- datasource:
- hide: 0
- includeAll: false
- label: Interval
- multi: false
- name: interval
- options:
- - selected: false
- text: auto
- value: "$__auto_interval"
- - selected: true
- text: 1m
- value: 1m
- - selected: false
- text: 10m
- value: 10m
- - selected: false
- text: 30m
- value: 30m
- - selected: false
- text: 1h
- value: 1h
- - selected: false
- text: 6h
- value: 6h
- - selected: false
- text: 12h
- value: 12h
- - selected: false
- text: 1d
- value: 1d
- - selected: false
- text: 7d
- value: 7d
- - selected: false
- text: 14d
- value: 14d
- - selected: false
- text: 30d
- value: 30d
- query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d
- refresh: 0
- type: interval
- - current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 0
- includeAll: false
- label: OSD
- multi: false
- name: osd
- options: []
- query: label_values(ceph_osd_metadata{release_group="$ceph_cluster"}, ceph_daemon)
- refresh: 1
- regex: ''
- type: query
- annotations:
- list: []
- refresh: 15m
- schemaVersion: 12
- version: 18
- links: []
- gnetId: 923
- description: CEPH OSD Status.
- ceph_pool:
- __inputs:
- - name: DS_PROMETHEUS
- label: Prometheus
- description: Prometheus.IO
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: panel
- id: singlestat
- name: Singlestat
- version: ''
- - type: grafana
- id: grafana
- name: Grafana
- version: 3.1.1
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- id:
- title: Ceph - Pools
- tags:
- - ceph
- - pools
- style: dark
- timezone: browser
- editable: true
- hideControls: false
- sharedCrosshair: false
- rows:
- - collapse: false
- editable: true
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 4
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- height: ''
- id: 2
- interval: "$interval"
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- rightSide: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 0
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: "/^Total.*$/"
- fill: 0
- linewidth: 4
- stack: false
- - alias: "/^Raw.*$/"
- color: "#BF1B00"
- fill: 0
- linewidth: 4
- span: 10
- stack: true
- steppedLine: false
- targets:
- - expr: ceph_pool_max_avail{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Total - {{ $pool }}
- refId: A
- step: 60
- - expr: ceph_pool_bytes_used{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Used - {{ $pool }}
- refId: B
- step: 60
- - expr: ceph_pool_max_avail{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - ceph_pool_bytes_used{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Available - {{ $pool }}
- refId: C
- step: 60
- - expr: ceph_pool_raw_bytes_used{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Raw - {{ $pool }}
- refId: D
- step: 60
- timeFrom:
- timeShift:
- title: "[[pool_name]] Pool Storage"
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- format: percentunit
- gauge:
- maxValue: 1
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 10
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: (ceph_pool_bytes_used{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} / ceph_pool_max_avail{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"})
- interval: "$interval"
- intervalFactor: 1
- refId: A
- step: 60
- thresholds: ''
- title: "[[pool_name]] Pool Usage"
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- showTitle: true
- title: 'Pool: $pool'
- - collapse: false
- editable: true
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- height: ''
- id: 7
- isNew: true
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: ceph_pool_objects{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Objects - {{ $pool_name }}
- refId: A
- step: 60
- - expr: ceph_pool_dirty{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Dirty Objects - {{ $pool_name }}
- refId: B
- step: 60
- timeFrom:
- timeShift:
- title: Objects in Pool [[pool_name]]
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- thresholdLine: false
- id: 4
- interval: "$interval"
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 6
- stack: true
- steppedLine: false
- targets:
- - expr: irate(ceph_pool_rd{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}[3m])
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Read - {{ $pool_name }}
- refId: B
- step: 60
- - expr: irate(ceph_pool_wr{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}[3m])
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Write - {{ $pool_name }}
- refId: A
- step: 60
- timeFrom:
- timeShift:
- title: "[[pool_name]] Pool IOPS"
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: none
- label: IOPS
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- label: IOPS
- logBase: 1
- max:
- min: 0
- show: false
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 5
- interval: "$interval"
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 12
- stack: true
- steppedLine: false
- targets:
- - expr: irate(ceph_pool_rd_bytes{pool_id="$pool",application="ceph",release_group="$ceph_cluster"}[3m])
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Read Bytes - {{ $pool_name }}
- refId: A
- step: 60
- - expr: irate(ceph_pool_wr_bytes{pool_id="$pool",application="ceph",release_group="$ceph_cluster"}[3m])
- interval: "$interval"
- intervalFactor: 1
- legendFormat: Written Bytes - {{ $pool_name }}
- refId: B
- step: 60
- timeFrom:
- timeShift:
- title: "[[pool_name]] Pool Throughput"
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: Bps
- label:
- logBase: 1
- max:
- min: 0
- show: true
- - format: Bps
- label:
- logBase: 1
- max:
- min: 0
- show: true
- title: New row
- time:
- from: now-3h
- to: now
- timepicker:
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- templating:
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- - current: {}
- hide: 0
- label: Cluster
- name: ceph_cluster
- options: []
- type: query
- query: label_values(ceph_health_status, release_group)
- refresh: 1
- sort: 2
- datasource: "${DS_PROMETHEUS}"
- - auto: true
- auto_count: 10
- auto_min: 1m
- current:
- selected: true
- text: 1m
- value: 1m
- datasource:
- hide: 0
- includeAll: false
- label: Interval
- multi: false
- name: interval
- options:
- - selected: false
- text: auto
- value: "$__auto_interval"
- - selected: true
- text: 1m
- value: 1m
- - selected: false
- text: 10m
- value: 10m
- - selected: false
- text: 30m
- value: 30m
- - selected: false
- text: 1h
- value: 1h
- - selected: false
- text: 6h
- value: 6h
- - selected: false
- text: 12h
- value: 12h
- - selected: false
- text: 1d
- value: 1d
- - selected: false
- text: 7d
- value: 7d
- - selected: false
- text: 14d
- value: 14d
- - selected: false
- text: 30d
- value: 30d
- query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d
- refresh: 0
- type: interval
- - current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 0
- includeAll: false
- label: Pool
- multi: false
- name: pool
- options: []
- query: label_values(ceph_pool_objects{release_group="$ceph_cluster"}, pool_id)
- refresh: 1
- regex: ''
- type: query
- - current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 0
- includeAll: false
- label: Pool
- multi: false
- name: pool_name
- options: []
- query: label_values(ceph_pool_metadata{release_group="$ceph_cluster",pool_id="[[pool]]" }, name)
- refresh: 1
- regex: ''
- type: query
- annotations:
- list: []
- refresh: 5m
- schemaVersion: 12
- version: 22
- links: []
- gnetId: 926
- description: Ceph Pools dashboard.
- containers:
- __inputs:
- - name: DS_PROMETHEUS
- label: Prometheus
- description: ''
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: panel
- id: singlestat
- name: Singlestat
- version: ''
- - type: grafana
- id: grafana
- name: Grafana
- version: 3.1.1
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.3.0
- id:
- title: Container Metrics (cAdvisor)
- description: Monitors Kubernetes cluster using Prometheus. Shows overall cluster CPU
- / Memory / Filesystem usage as well as individual pod, containers, systemd services
- statistics. Uses cAdvisor metrics only.
- tags:
- - kubernetes
- style: dark
- timezone: browser
- editable: true
- hideControls: false
- sharedCrosshair: false
- rows:
- - collapse: false
- editable: true
- height: 200px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- thresholdLine: false
- height: 200px
- id: 32
- isNew: true
- legend:
- alignAsTable: false
- avg: true
- current: true
- max: false
- min: false
- rightSide: false
- show: false
- sideWidth: 200
- sort: current
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 12
- stack: false
- steppedLine: false
- targets:
- - expr: sum (rate (container_network_receive_bytes_total{kubernetes_io_hostname=~"^$Node$"}[5m]))
- interval: 10s
- intervalFactor: 1
- legendFormat: Received
- metric: network
- refId: A
- step: 10
- - expr: '- sum (rate (container_network_transmit_bytes_total{kubernetes_io_hostname=~"^$Node$"}[5m]))'
- interval: 10s
- intervalFactor: 1
- legendFormat: Sent
- metric: network
- refId: B
- step: 10
- timeFrom:
- timeShift:
- title: Network I/O pressure
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: Bps
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: Bps
- label:
- logBase: 1
- max:
- min:
- show: false
- title: Network I/O pressure
- - collapse: false
- editable: true
- height: 250px
- panels:
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- height: 180px
- id: 4
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 4
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum (container_memory_working_set_bytes{id="/",kubernetes_io_hostname=~"^$Node$"})
- / sum (machine_memory_bytes{kubernetes_io_hostname=~"^$Node$"}) * 100
- interval: 10s
- intervalFactor: 1
- refId: A
- step: 10
- thresholds: 65, 90
- title: Cluster memory usage
- transparent: false
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- height: 180px
- id: 6
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 4
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum (rate (container_cpu_usage_seconds_total{id="/",kubernetes_io_hostname=~"^$Node$"}[5m]))
- / sum (machine_cpu_cores{kubernetes_io_hostname=~"^$Node$"}) * 100
- interval: 10s
- intervalFactor: 1
- refId: A
- step: 10
- thresholds: 65, 90
- title: Cluster CPU usage (5m avg)
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- height: 180px
- id: 7
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 4
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum (container_fs_usage_bytes{device=~"^/dev/[sv]da[0-9]$",id=~"/.+",kubernetes_io_hostname=~"^$Node$"})
- / sum (container_fs_limit_bytes{device=~"^/dev/[sv]da[0-9]$",id=~"/.+",kubernetes_io_hostname=~"^$Node$"})
- * 100
- interval: 10s
- intervalFactor: 1
- legendFormat: ''
- metric: ''
- refId: A
- step: 10
- thresholds: 65, 90
- title: Cluster filesystem usage
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- format: bytes
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: 1px
- id: 9
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 20%
- prefix: ''
- prefixFontSize: 20%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum (container_memory_working_set_bytes{id="/",kubernetes_io_hostname=~"^$Node$"})
- interval: 10s
- intervalFactor: 1
- refId: A
- step: 10
- thresholds: ''
- title: Used
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- format: bytes
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: 1px
- id: 10
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum (machine_memory_bytes{kubernetes_io_hostname=~"^$Node$"})
- interval: 10s
- intervalFactor: 1
- refId: A
- step: 10
- thresholds: ''
- title: Total
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: 1px
- id: 11
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: " cores"
- postfixFontSize: 30%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum (rate (container_cpu_usage_seconds_total{id="/",kubernetes_io_hostname=~"^$Node$"}[5m]))
- interval: 10s
- intervalFactor: 1
- refId: A
- step: 10
- thresholds: ''
- title: Used
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: 1px
- id: 12
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: " cores"
- postfixFontSize: 30%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum (machine_cpu_cores{kubernetes_io_hostname=~"^$Node$"})
- interval: 10s
- intervalFactor: 1
- refId: A
- step: 10
- thresholds: ''
- title: Total
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- format: bytes
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: 1px
- id: 13
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum (container_fs_usage_bytes{device=~"^/dev/[sv]da[0-9]$",id=~"/.+",kubernetes_io_hostname=~"^$Node$"})
- interval: 10s
- intervalFactor: 1
- refId: A
- step: 10
- thresholds: ''
- title: Used
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- format: bytes
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: 1px
- id: 14
- interval:
- isNew: true
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: sum (container_fs_limit_bytes{device=~"^/dev/[sv]da[0-9]$",id=~"/.+",kubernetes_io_hostname=~"^$Node$"})
- interval: 10s
- intervalFactor: 1
- refId: A
- step: 10
- thresholds: ''
- title: Total
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- showTitle: false
- title: Total usage
- - collapse: false
- editable: true
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 3
- editable: true
- error: false
- fill: 0
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- height: ''
- id: 17
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: false
- min: false
- rightSide: true
- show: true
- sort: current
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 12
- stack: false
- steppedLine: true
- targets:
- - expr: sum (rate (container_cpu_usage_seconds_total{image!="",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (pod)
- interval: 10s
- intervalFactor: 1
- legendFormat: "{{ pod }}"
- metric: container_cpu
- refId: A
- step: 10
- timeFrom:
- timeShift:
- title: Pods CPU usage (5m avg)
- tooltip:
- msResolution: true
- shared: true
- sort: 2
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: none
- label: cores
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- showTitle: false
- title: Pods CPU usage
- - collapse: true
- editable: true
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 3
- editable: true
- error: false
- fill: 0
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- height: ''
- id: 24
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: false
- min: false
- rightSide: true
- show: true
- sideWidth:
- sort: current
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 12
- stack: false
- steppedLine: true
- targets:
- - expr: sum (rate (container_cpu_usage_seconds_total{image!="",name=~"^k8s_.*",container!="POD",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (container, pod)
- hide: false
- interval: 10s
- intervalFactor: 1
- legendFormat: 'pod: {{ pod }} | {{ container }}'
- metric: container_cpu
- refId: A
- step: 10
- - expr: sum (rate (container_cpu_usage_seconds_total{image!="",name!~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (kubernetes_io_hostname, name, image)
- hide: false
- interval: 10s
- intervalFactor: 1
- legendFormat: 'docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})'
- metric: container_cpu
- refId: B
- step: 10
- - expr: sum (rate (container_cpu_usage_seconds_total{rkt_container_name!="",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (kubernetes_io_hostname, rkt_container_name)
- interval: 10s
- intervalFactor: 1
- legendFormat: 'rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}'
- metric: container_cpu
- refId: C
- step: 10
- timeFrom:
- timeShift:
- title: Containers CPU usage (5m avg)
- tooltip:
- msResolution: true
- shared: true
- sort: 2
- value_type: cumulative
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: none
- label: cores
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- title: Containers CPU usage
- - collapse: true
- editable: true
- height: 500px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 3
- editable: true
- error: false
- fill: 0
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 20
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: false
- min: false
- rightSide: false
- show: true
- sort: current
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 12
- stack: false
- steppedLine: true
- targets:
- - expr: sum (rate (container_cpu_usage_seconds_total{id!="/",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (id)
- hide: false
- interval: 10s
- intervalFactor: 1
- legendFormat: "{{ id }}"
- metric: container_cpu
- refId: A
- step: 10
- timeFrom:
- timeShift:
- title: All processes CPU usage (5m avg)
- tooltip:
- msResolution: true
- shared: true
- sort: 2
- value_type: cumulative
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: none
- label: cores
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- repeat:
- showTitle: false
- title: All processes CPU usage
- - collapse: false
- editable: true
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 0
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 25
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: false
- min: false
- rightSide: true
- show: true
- sideWidth: 200
- sort: current
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 12
- stack: false
- steppedLine: true
- targets:
- - expr: sum (container_memory_working_set_bytes{image!="",kubernetes_io_hostname=~"^$Node$"})
- by (pod)
- interval: 10s
- intervalFactor: 1
- legendFormat: "{{ pod }}"
- metric: container_memory_usage:sort_desc
- refId: A
- step: 10
- timeFrom:
- timeShift:
- title: Pods memory usage
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: cumulative
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- title: Pods memory usage
- - collapse: true
- editable: true
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 0
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 27
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: false
- min: false
- rightSide: true
- show: true
- sideWidth: 200
- sort: current
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 12
- stack: false
- steppedLine: true
- targets:
- - expr: sum (container_memory_working_set_bytes{image!="",name=~"^k8s_.*",container!="POD",kubernetes_io_hostname=~"^$Node$"})
- by (container, pod)
- interval: 10s
- intervalFactor: 1
- legendFormat: 'pod: {{ pod }} | {{ container }}'
- metric: container_memory_usage:sort_desc
- refId: A
- step: 10
- - expr: sum (container_memory_working_set_bytes{image!="",name!~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"})
- by (kubernetes_io_hostname, name, image)
- interval: 10s
- intervalFactor: 1
- legendFormat: 'docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})'
- metric: container_memory_usage:sort_desc
- refId: B
- step: 10
- - expr: sum (container_memory_working_set_bytes{rkt_container_name!="",kubernetes_io_hostname=~"^$Node$"})
- by (kubernetes_io_hostname, rkt_container_name)
- interval: 10s
- intervalFactor: 1
- legendFormat: 'rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}'
- metric: container_memory_usage:sort_desc
- refId: C
- step: 10
- timeFrom:
- timeShift:
- title: Containers memory usage
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: cumulative
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- title: Containers memory usage
- - collapse: true
- editable: true
- height: 500px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 0
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 28
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: false
- min: false
- rightSide: false
- show: true
- sideWidth: 200
- sort: current
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 12
- stack: false
- steppedLine: true
- targets:
- - expr: sum (container_memory_working_set_bytes{id!="/",kubernetes_io_hostname=~"^$Node$"})
- by (id)
- interval: 10s
- intervalFactor: 1
- legendFormat: "{{ id }}"
- metric: container_memory_usage:sort_desc
- refId: A
- step: 10
- timeFrom:
- timeShift:
- title: All processes memory usage
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: cumulative
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- title: All processes memory usage
- - collapse: false
- editable: true
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 16
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: false
- min: false
- rightSide: true
- show: true
- sideWidth: 200
- sort: current
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 12
- stack: false
- steppedLine: false
- targets:
- - expr: sum (rate (container_network_receive_bytes_total{image!="",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (pod)
- interval: 10s
- intervalFactor: 1
- legendFormat: "-> {{ pod }}"
- metric: network
- refId: A
- step: 10
- - expr: '- sum (rate (container_network_transmit_bytes_total{image!="",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (pod)'
- interval: 10s
- intervalFactor: 1
- legendFormat: "<- {{ pod }}"
- metric: network
- refId: B
- step: 10
- timeFrom:
- timeShift:
- title: Pods network I/O (5m avg)
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: cumulative
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: Bps
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- title: Pods network I/O
- - collapse: true
- editable: true
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 30
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: false
- min: false
- rightSide: true
- show: true
- sideWidth: 200
- sort: current
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 12
- stack: false
- steppedLine: false
- targets:
- - expr: sum (rate (container_network_receive_bytes_total{image!="",name=~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (container, pod)
- hide: false
- interval: 10s
- intervalFactor: 1
- legendFormat: "-> pod: {{ pod }} | {{ container }}"
- metric: network
- refId: B
- step: 10
- - expr: '- sum (rate (container_network_transmit_bytes_total{image!="",name=~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (container, pod)'
- hide: false
- interval: 10s
- intervalFactor: 1
- legendFormat: "<- pod: {{ pod }} | {{ container }}"
- metric: network
- refId: D
- step: 10
- - expr: sum (rate (container_network_receive_bytes_total{image!="",name!~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (kubernetes_io_hostname, name, image)
- hide: false
- interval: 10s
- intervalFactor: 1
- legendFormat: "-> docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name
- }})"
- metric: network
- refId: A
- step: 10
- - expr: '- sum (rate (container_network_transmit_bytes_total{image!="",name!~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (kubernetes_io_hostname, name, image)'
- hide: false
- interval: 10s
- intervalFactor: 1
- legendFormat: "<- docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name
- }})"
- metric: network
- refId: C
- step: 10
- - expr: sum (rate (container_network_transmit_bytes_total{rkt_container_name!="",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (kubernetes_io_hostname, rkt_container_name)
- hide: false
- interval: 10s
- intervalFactor: 1
- legendFormat: "-> rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name
- }}"
- metric: network
- refId: E
- step: 10
- - expr: '- sum (rate (container_network_transmit_bytes_total{rkt_container_name!="",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (kubernetes_io_hostname, rkt_container_name)'
- hide: false
- interval: 10s
- intervalFactor: 1
- legendFormat: "<- rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name
- }}"
- metric: network
- refId: F
- step: 10
- timeFrom:
- timeShift:
- title: Containers network I/O (5m avg)
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: cumulative
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: Bps
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- title: Containers network I/O
- - collapse: true
- editable: true
- height: 500px
- panels:
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 1
- grid:
- threshold1:
- threshold1Color: rgba(216, 200, 27, 0.27)
- threshold2:
- threshold2Color: rgba(234, 112, 112, 0.22)
- id: 29
- isNew: true
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: false
- min: false
- rightSide: false
- show: true
- sideWidth: 200
- sort: current
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 12
- stack: false
- steppedLine: false
- targets:
- - expr: sum (rate (container_network_receive_bytes_total{id!="/",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (id)
- interval: 10s
- intervalFactor: 1
- legendFormat: "-> {{ id }}"
- metric: network
- refId: A
- step: 10
- - expr: '- sum (rate (container_network_transmit_bytes_total{id!="/",kubernetes_io_hostname=~"^$Node$"}[5m]))
- by (id)'
- interval: 10s
- intervalFactor: 1
- legendFormat: "<- {{ id }}"
- metric: network
- refId: B
- step: 10
- timeFrom:
- timeShift:
- title: All processes network I/O (5m avg)
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: cumulative
- type: graph
- xaxis:
- show: true
- yaxes:
- - format: Bps
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- title: All processes network I/O
- time:
- from: now-5m
- to: now
- timepicker:
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- templating:
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- - allValue: ".*"
- current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 0
- includeAll: true
- multi: false
- name: Node
- options: []
- query: label_values(kubernetes_io_hostname)
- refresh: 1
- type: query
- annotations:
- list: []
- refresh: 5m
- schemaVersion: 12
- version: 13
- links: []
- gnetId: 315
- coredns:
- __inputs:
- - name: prometheus
- label: Prometheus
- description: ''
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: grafana
- id: grafana
- name: Grafana
- version: 4.4.3
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- annotations:
- list: []
- editable: true
- gnetId: 5926
- graphTooltip: 0
- hideControls: false
- id:
- links: []
- rows:
- - collapse: false
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 1
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: total
- yaxis: 2
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m]))
- by (proto)
- format: time_series
- intervalFactor: 2
- legendFormat: "{{proto}}"
- refId: A
- step: 60
- - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m]))
- format: time_series
- intervalFactor: 2
- legendFormat: total
- refId: B
- step: 60
- thresholds: []
- timeFrom:
- timeShift:
- title: Requests (total)
- tooltip:
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: pps
- logBase: 1
- max:
- min: 0
- show: true
- - format: pps
- logBase: 1
- max:
- min: 0
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 12
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: total
- yaxis: 2
- - alias: other
- yaxis: 2
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(coredns_dns_request_type_count_total{instance=~"$instance"}[5m]))
- by (type)
- intervalFactor: 2
- legendFormat: "{{type}}"
- refId: A
- step: 60
- thresholds: []
- timeFrom:
- timeShift:
- title: Requests (by qtype)
- tooltip:
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: pps
- logBase: 1
- max:
- min: 0
- show: true
- - format: pps
- logBase: 1
- max:
- min: 0
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 2
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: total
- yaxis: 2
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m]))
- by (zone)
- intervalFactor: 2
- legendFormat: "{{zone}}"
- refId: A
- step: 60
- - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m]))
- intervalFactor: 2
- legendFormat: total
- refId: B
- step: 60
- thresholds: []
- timeFrom:
- timeShift:
- title: Requests (by zone)
- tooltip:
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: pps
- logBase: 1
- max:
- min: 0
- show: true
- - format: pps
- logBase: 1
- max:
- min: 0
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 10
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: total
- yaxis: 2
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(coredns_dns_request_do_count_total{instance=~"$instance"}[5m]))
- intervalFactor: 2
- legendFormat: DO
- refId: A
- step: 40
- - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m]))
- intervalFactor: 2
- legendFormat: total
- refId: B
- step: 40
- thresholds: []
- timeFrom:
- timeShift:
- title: Requests (DO bit)
- tooltip:
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: pps
- logBase: 1
- max:
- min: 0
- show: true
- - format: pps
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 9
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: tcp:90
- yaxis: 2
- - alias: 'tcp:99 '
- yaxis: 2
- - alias: tcp:50
- yaxis: 2
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: histogram_quantile(0.99, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m]))
- by (le,proto))
- intervalFactor: 2
- legendFormat: "{{proto}}:99 "
- refId: A
- step: 60
- - expr: histogram_quantile(0.90, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m]))
- by (le,proto))
- intervalFactor: 2
- legendFormat: "{{proto}}:90"
- refId: B
- step: 60
- - expr: histogram_quantile(0.50, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m]))
- by (le,proto))
- intervalFactor: 2
- legendFormat: "{{proto}}:50"
- refId: C
- step: 60
- thresholds: []
- timeFrom:
- timeShift:
- title: Requests (size, udp)
- tooltip:
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- logBase: 1
- max:
- min: 0
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 14
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: tcp:90
- yaxis: 1
- - alias: 'tcp:99 '
- yaxis: 1
- - alias: tcp:50
- yaxis: 1
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: histogram_quantile(0.99, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m]))
- by (le,proto))
- intervalFactor: 2
- legendFormat: "{{proto}}:99 "
- refId: A
- step: 60
- - expr: histogram_quantile(0.90, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m]))
- by (le,proto))
- intervalFactor: 2
- legendFormat: "{{proto}}:90"
- refId: B
- step: 60
- - expr: histogram_quantile(0.50, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m]))
- by (le,proto))
- intervalFactor: 2
- legendFormat: "{{proto}}:50"
- refId: C
- step: 60
- thresholds: []
- timeFrom:
- timeShift:
- title: Requests (size,tcp)
- tooltip:
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- logBase: 1
- max:
- min: 0
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: Row
- titleSize: h6
- - collapse: false
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 5
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(coredns_dns_response_rcode_count_total{instance=~"$instance"}[5m]))
- by (rcode)
- intervalFactor: 2
- legendFormat: "{{rcode}}"
- refId: A
- step: 40
- thresholds: []
- timeFrom:
- timeShift:
- title: Responses (by rcode)
- tooltip:
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: pps
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 3
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: histogram_quantile(0.99, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~"$instance"}[5m]))
- by (le, job))
- intervalFactor: 2
- legendFormat: 99%
- refId: A
- step: 40
- - expr: histogram_quantile(0.90, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~"$instance"}[5m]))
- by (le))
- intervalFactor: 2
- legendFormat: 90%
- refId: B
- step: 40
- - expr: histogram_quantile(0.50, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~"$instance"}[5m]))
- by (le))
- intervalFactor: 2
- legendFormat: 50%
- refId: C
- step: 40
- thresholds: []
- timeFrom:
- timeShift:
- title: Responses (duration)
- tooltip:
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: s
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 8
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: udp:50%
- yaxis: 1
- - alias: tcp:50%
- yaxis: 2
- - alias: tcp:90%
- yaxis: 2
- - alias: tcp:99%
- yaxis: 2
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: 'histogram_quantile(0.99, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m]))
- by (le,proto)) '
- intervalFactor: 2
- legendFormat: "{{proto}}:99%"
- refId: A
- step: 40
- - expr: 'histogram_quantile(0.90, sum(rate(coredns_dns_response_size_bytes_bucket{instance="$instance",proto="udp"}[5m]))
- by (le,proto)) '
- intervalFactor: 2
- legendFormat: "{{proto}}:90%"
- refId: B
- step: 40
- - expr: 'histogram_quantile(0.50, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m]))
- by (le,proto)) '
- intervalFactor: 2
- legendFormat: "{{proto}}:50%"
- metric: ''
- refId: C
- step: 40
- thresholds: []
- timeFrom:
- timeShift:
- title: Responses (size, udp)
- tooltip:
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- logBase: 1
- max:
- min: 0
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 13
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: udp:50%
- yaxis: 1
- - alias: tcp:50%
- yaxis: 1
- - alias: tcp:90%
- yaxis: 1
- - alias: tcp:99%
- yaxis: 1
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: 'histogram_quantile(0.99, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m]))
- by (le,proto)) '
- intervalFactor: 2
- legendFormat: "{{proto}}:99%"
- refId: A
- step: 40
- - expr: 'histogram_quantile(0.90, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m]))
- by (le,proto)) '
- intervalFactor: 2
- legendFormat: "{{proto}}:90%"
- refId: B
- step: 40
- - expr: 'histogram_quantile(0.50, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m]))
- by (le, proto)) '
- intervalFactor: 2
- legendFormat: "{{proto}}:50%"
- metric: ''
- refId: C
- step: 40
- thresholds: []
- timeFrom:
- timeShift:
- title: Responses (size, tcp)
- tooltip:
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- logBase: 1
- max:
- min: 0
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: New row
- titleSize: h6
- - collapse: false
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 15
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(coredns_cache_size{instance=~"$instance"}) by (type)
- intervalFactor: 2
- legendFormat: "{{type}}"
- refId: A
- step: 40
- thresholds: []
- timeFrom:
- timeShift:
- title: Cache (size)
- tooltip:
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- logBase: 1
- max:
- min: 0
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 16
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: misses
- yaxis: 2
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(coredns_cache_hits_total{instance=~"$instance"}[5m])) by (type)
- intervalFactor: 2
- legendFormat: hits:{{type}}
- refId: A
- step: 40
- - expr: sum(rate(coredns_cache_misses_total{instance=~"$instance"}[5m])) by (type)
- intervalFactor: 2
- legendFormat: misses
- refId: B
- step: 40
- thresholds: []
- timeFrom:
- timeShift:
- title: Cache (hitrate)
- tooltip:
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: pps
- logBase: 1
- max:
- min: 0
- show: true
- - format: pps
- logBase: 1
- max:
- min: 0
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: New row
- titleSize: h6
- schemaVersion: 14
- style: dark
- tags:
- - dns
- - coredns
- templating:
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- - allValue: ".*"
- current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 0
- includeAll: true
- label: Instance
- multi: false
- name: instance
- options: []
- query: up{job="coredns"}
- refresh: 1
- regex: .*instance="(.*?)".*
- sort: 0
- tagValuesQuery: ''
- tags: []
- tagsQuery: ''
- type: query
- useTags: false
- time:
- from: now-3h
- to: now
- timepicker:
- now: true
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- timezone: utc
- title: CoreDNS
- version: 3
- description: A dashboard for the CoreDNS DNS server.
- elasticsearch:
- __inputs:
- - name: DS_PROMETHEUS
- label: Prometheus
- description: ''
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: grafana
- id: grafana
- name: Grafana
- version: 4.6.3
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- - type: panel
- id: singlestat
- name: Singlestat
- version: ''
- annotations:
- list:
- - builtIn: 1
- datasource: "-- Grafana --"
- enable: true
- hide: true
- iconColor: rgba(0, 211, 255, 1)
- name: Annotations & Alerts
- type: dashboard
- editable: true
- gnetId: 4358
- graphTooltip: 1
- hideControls: false
- id:
- links: []
- refresh: 5m
- rows:
- - collapse: false
- height:
- panels:
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(178, 49, 13, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: '50'
- id: 8
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 5
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: true
- lineColor: rgb(31, 120, 193)
- show: true
- tableColumn: ''
- targets:
- - expr: (sum(elasticsearch_cluster_health_status{cluster=~"$cluster",color="green"})*2)+sum(elasticsearch_cluster_health_status{cluster=~"$cluster",color="yellow"})
- format: time_series
- intervalFactor: 3
- legendFormat: ''
- metric: ''
- refId: A
- step: 40
- thresholds: '0,1,2'
- title: Cluster health status
- transparent: false
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: GREEN
- value: '2'
- - op: "="
- text: YELLOW
- value: '1'
- - op: "="
- text: RED
- value: '0'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: '50'
- id: 10
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: sum(elasticsearch_cluster_health_number_of_nodes{cluster=~"$cluster"})
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: ''
- metric: ''
- refId: A
- step: 40
- thresholds: ''
- title: Nodes
- transparent: false
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: '50'
- id: 9
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: elasticsearch_cluster_health_number_of_data_nodes{cluster="$cluster"}
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: ''
- metric: ''
- refId: A
- step: 40
- thresholds: ''
- title: Data nodes
- transparent: false
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: '50'
- hideTimeOverride: true
- id: 16
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: true
- tableColumn: ''
- targets:
- - expr: elasticsearch_cluster_health_number_of_pending_tasks{cluster="$cluster"}
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: ''
- metric: ''
- refId: A
- step: 40
- thresholds: ''
- title: Pending tasks
- transparent: false
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Cluster
- titleSize: h6
- - collapse: false
- height: ''
- panels:
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: '50'
- id: 11
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- minSpan: 2
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- repeat: shard_type
- span: 2.4
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: true
- lineColor: rgb(31, 120, 193)
- show: true
- tableColumn: ''
- targets:
- - expr: elasticsearch_cluster_health_active_primary_shards{cluster="$cluster"}
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 40
- thresholds: ''
- title: active primary shards
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: '50'
- id: 39
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- minSpan: 2
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2.4
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: true
- lineColor: rgb(31, 120, 193)
- show: true
- tableColumn: ''
- targets:
- - expr: elasticsearch_cluster_health_active_shards{cluster="$cluster"}
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 40
- thresholds: ''
- title: active shards
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: '50'
- id: 40
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- minSpan: 2
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2.4
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: true
- lineColor: rgb(31, 120, 193)
- show: true
- tableColumn: ''
- targets:
- - expr: elasticsearch_cluster_health_initializing_shards{cluster="$cluster"}
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 40
- thresholds: ''
- title: initializing shards
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: '50'
- id: 41
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- minSpan: 2
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2.4
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: true
- lineColor: rgb(31, 120, 193)
- show: true
- tableColumn: ''
- targets:
- - expr: elasticsearch_cluster_health_relocating_shards{cluster="$cluster"}
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 40
- thresholds: ''
- title: relocating shards
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- height: '50'
- id: 42
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- minSpan: 2
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2.4
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: true
- lineColor: rgb(31, 120, 193)
- show: true
- tableColumn: ''
- targets:
- - expr: elasticsearch_cluster_health_unassigned_shards{cluster="$cluster"}
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 40
- thresholds: ''
- title: unassigned shards
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Shards
- titleSize: h6
- - collapse: false
- height:
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 30
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: elasticsearch_process_cpu_percent{cluster="$cluster",es_master_node="true",name=~"$node"}
- format: time_series
- instant: false
- interval: ''
- intervalFactor: 2
- legendFormat: "{{ name }} - master"
- metric: ''
- refId: A
- step: 10
- - expr: elasticsearch_process_cpu_percent{cluster="$cluster",es_data_node="true",name=~"$node"}
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{ name }} - data"
- metric: ''
- refId: B
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: CPU usage
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: percent
- label: CPU usage
- logBase: 1
- max: 100
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 0
- grid: {}
- height: '400'
- id: 31
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: elasticsearch_jvm_memory_used_bytes{cluster="$cluster",name=~"$node",name=~"$node"}
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{ name }} - used: {{area}}"
- metric: ''
- refId: A
- step: 10
- - expr: elasticsearch_jvm_memory_committed_bytes{cluster="$cluster",name=~"$node",name=~"$node"}
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} - committed: {{area}}"
- refId: B
- step: 10
- - expr: elasticsearch_jvm_memory_max_bytes{cluster="$cluster",name=~"$node",name=~"$node"}
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} - max: {{area}}"
- refId: C
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: JVM memory usage
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label: Memory
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 32
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: 1-(elasticsearch_filesystem_data_available_bytes{cluster="$cluster"}/elasticsearch_filesystem_data_size_bytes{cluster="$cluster",name=~"$node"})
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{ name }} - {{path}}"
- metric: ''
- refId: A
- step: 10
- thresholds:
- - colorMode: custom
- fill: true
- fillColor: rgba(216, 200, 27, 0.27)
- op: gt
- value: 0.8
- - colorMode: custom
- fill: true
- fillColor: rgba(234, 112, 112, 0.22)
- op: gt
- value: 0.9
- timeFrom:
- timeShift:
- title: Disk usage
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: percentunit
- label: Disk Usage %
- logBase: 1
- max: 1
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 47
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- sort: max
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: sent
- transform: negative-Y
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: irate(elasticsearch_transport_tx_size_bytes_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} -sent"
- refId: D
- step: 10
- - expr: irate(elasticsearch_transport_rx_size_bytes_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} -received"
- refId: C
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Network usage
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: Bps
- label: Bytes/sec
- logBase: 1
- max:
- min:
- show: true
- - format: pps
- label: ''
- logBase: 1
- max:
- min:
- show: false
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: System
- titleSize: h6
- - collapse: false
- height: ''
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 1
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: true
- steppedLine: false
- targets:
- - expr: elasticsearch_indices_docs{cluster="$cluster",name=~"$node"}
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{ name }}"
- metric: ''
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Documents count
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label: Documents
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 24
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: true
- steppedLine: false
- targets:
- - expr: irate(elasticsearch_indices_indexing_index_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{name}}"
- metric: ''
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Documents indexed rate
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label: index calls/s
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 25
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: true
- steppedLine: false
- targets:
- - expr: rate(elasticsearch_indices_docs_deleted{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{name}}"
- metric: ''
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Documents deleted rate
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label: Documents/s
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 26
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: true
- steppedLine: false
- targets:
- - expr: rate(elasticsearch_indices_merges_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{name}}"
- metric: ''
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Documents merged rate
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label: Documents/s
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Documents
- titleSize: h6
- - collapse: false
- height: 250
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 48
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- sort: avg
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: irate(elasticsearch_indices_indexing_index_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{ name }} - indexing"
- metric: ''
- refId: A
- step: 4
- - expr: irate(elasticsearch_indices_search_query_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} - query"
- refId: B
- step: 4
- - expr: irate(elasticsearch_indices_search_fetch_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} - fetch"
- refId: C
- step: 4
- - expr: irate(elasticsearch_indices_merges_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} - merges"
- refId: D
- step: 4
- - expr: irate(elasticsearch_indices_refresh_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} - refresh"
- refId: E
- step: 4
- - expr: irate(elasticsearch_indices_flush_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} - flush"
- refId: F
- step: 4
- thresholds: []
- timeFrom:
- timeShift:
- title: Total Operations rate
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label: Operations/s
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 49
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- sort: avg
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: irate(elasticsearch_indices_indexing_index_time_seconds_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{ name }} - indexing"
- metric: ''
- refId: A
- step: 4
- - expr: irate(elasticsearch_indices_search_query_time_ms_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} - query"
- refId: B
- step: 4
- - expr: irate(elasticsearch_indices_search_fetch_time_ms_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} - fetch"
- refId: C
- step: 4
- - expr: irate(elasticsearch_indices_merges_total_time_ms_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} - merges"
- refId: D
- step: 4
- - expr: irate(elasticsearch_indices_refresh_total_time_ms_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} - refresh"
- refId: E
- step: 4
- - expr: irate(elasticsearch_indices_flush_time_ms_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ name }} - flush"
- refId: F
- step: 4
- thresholds: []
- timeFrom:
- timeShift:
- title: Total Operations time
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: ms
- label: Time
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Total Operations stats
- titleSize: h6
- - collapse: false
- height: ''
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 33
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: 'rate(elasticsearch_indices_search_query_time_seconds{cluster="$cluster",name=~"$node"}[$interval]) '
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{name}}"
- metric: ''
- refId: A
- step: 4
- thresholds: []
- timeFrom:
- timeShift:
- title: Query time
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: ms
- label: Time
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 5
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: rate(elasticsearch_indices_indexing_index_time_seconds_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{name}}"
- metric: ''
- refId: A
- step: 4
- thresholds: []
- timeFrom:
- timeShift:
- title: Indexing time
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: ms
- label: Time
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 3
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: rate(elasticsearch_indices_merges_total_time_seconds_total{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{name}}"
- metric: ''
- refId: A
- step: 4
- thresholds: []
- timeFrom:
- timeShift:
- title: Merging time
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: s
- label: Time
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Times
- titleSize: h6
- - collapse: false
- height:
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 4
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: true
- steppedLine: false
- targets:
- - expr: elasticsearch_indices_fielddata_memory_size_bytes{cluster="$cluster",name=~"$node"}
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{name}}"
- metric: ''
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Field data memory size
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label: Memory
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 34
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: true
- steppedLine: false
- targets:
- - expr: rate(elasticsearch_indices_fielddata_evictions{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{name}}"
- metric: ''
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Field data evictions
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label: Evictions/s
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 35
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: true
- steppedLine: false
- targets:
- - expr: elasticsearch_indices_query_cache_memory_size_bytes{cluster="$cluster",name=~"$node"}
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{name}}"
- metric: ''
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Query cache size
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label: Size
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 36
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: true
- steppedLine: false
- targets:
- - expr: rate(elasticsearch_indices_query_cache_evictions{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{name}}"
- metric: ''
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Query cache evictions
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label: Evictions/s
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Caches
- titleSize: h6
- - collapse: false
- height: 728
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 45
- legend:
- alignAsTable: true
- avg: true
- current: false
- max: true
- min: true
- show: true
- sort: avg
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: ' irate(elasticsearch_thread_pool_rejected_count{cluster="$cluster",name=~"$node"}[$interval])'
- format: time_series
- intervalFactor: 2
- legendFormat: "{{name}} - {{ type }}"
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Thread Pool operations rejected
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 46
- legend:
- alignAsTable: true
- avg: true
- current: false
- max: true
- min: true
- show: true
- sort: avg
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: elasticsearch_thread_pool_active_count{cluster="$cluster",name=~"$node"}
- format: time_series
- intervalFactor: 2
- legendFormat: "{{name}} - {{ type }}"
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Thread Pool operations queued
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- height: ''
- id: 43
- legend:
- alignAsTable: true
- avg: true
- current: false
- max: true
- min: true
- show: true
- sort: avg
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: elasticsearch_thread_pool_active_count{cluster="$cluster",name=~"$node"}
- format: time_series
- intervalFactor: 2
- legendFormat: "{{name}} - {{ type }}"
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Thread Pool threads active
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 44
- legend:
- alignAsTable: true
- avg: true
- current: false
- max: true
- min: true
- show: true
- sort: avg
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: irate(elasticsearch_thread_pool_completed_count{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- intervalFactor: 2
- legendFormat: "{{name}} - {{ type }}"
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Thread Pool operations completed
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Thread Pool
- titleSize: h6
- - collapse: false
- height:
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 7
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: true
- steppedLine: false
- targets:
- - expr: rate(elasticsearch_jvm_gc_collection_seconds_count{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{name}} - {{gc}}"
- metric: ''
- refId: A
- step: 4
- thresholds: []
- timeFrom:
- timeShift:
- title: GC count
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label: GCs
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- height: '400'
- id: 27
- legend:
- alignAsTable: true
- avg: true
- current: true
- hideEmpty: false
- hideZero: false
- max: true
- min: true
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: rate(elasticsearch_jvm_gc_collection_seconds_count{cluster="$cluster",name=~"$node"}[$interval])
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{name}} - {{gc}}"
- metric: ''
- refId: A
- step: 4
- thresholds: []
- timeFrom:
- timeShift:
- title: GC time
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- transparent: false
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: s
- label: Time
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: JVM Garbage Collection
- titleSize: h6
- schemaVersion: 14
- style: dark
- tags:
- - elasticsearch
- - App
- templating:
- list:
- - auto: true
- auto_count: 30
- auto_min: 10s
- current:
- text: auto
- value: "$__auto_interval"
- hide: 0
- label: Interval
- name: interval
- options:
- - selected: true
- text: auto
- value: "$__auto_interval"
- - selected: false
- text: 1m
- value: 1m
- - selected: false
- text: 10m
- value: 10m
- - selected: false
- text: 30m
- value: 30m
- - selected: false
- text: 1h
- value: 1h
- - selected: false
- text: 6h
- value: 6h
- - selected: false
- text: 12h
- value: 12h
- - selected: false
- text: 1d
- value: 1d
- - selected: false
- text: 7d
- value: 7d
- - selected: false
- text: 14d
- value: 14d
- - selected: false
- text: 30d
- value: 30d
- query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d
- refresh: 2
- type: interval
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- - allValue:
- current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 0
- includeAll: false
- label: Instance
- multi: false
- name: cluster
- options: []
- query: label_values(elasticsearch_cluster_health_status,cluster)
- refresh: 1
- regex: ''
- sort: 1
- tagValuesQuery:
- tags: []
- tagsQuery:
- type: query
- useTags: false
- - allValue:
- current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 0
- includeAll: true
- label: node
- multi: true
- name: node
- options: []
- query: label_values(elasticsearch_process_cpu_percent,name)
- refresh: 1
- regex: ''
- sort: 1
- tagValuesQuery:
- tags: []
- tagsQuery:
- type: query
- useTags: false
- time:
- from: now-12h
- to: now
- timepicker:
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- timezone: browser
- title: Elasticsearch
- version: 1
- description: Elasticsearch detailed dashboard
- kubernetes_capacity_planning:
- __inputs:
- - name: DS_PROMETHEUS
- label: prometheus
- description: ''
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: grafana
- id: grafana
- name: Grafana
- version: 4.4.1
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- - type: panel
- id: singlestat
- name: Singlestat
- version: ''
- annotations:
- list: []
- description: ''
- editable: true
- gnetId: 22
- graphTooltip: 0
- hideControls: false
- id:
- links: []
- refresh: false
- rows:
- - collapse: false
- height: 250px
- panels:
- - alerting: {}
- aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 3
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(node_cpu{mode="idle"}[2m])) * 100
- hide: false
- intervalFactor: 10
- legendFormat: ''
- refId: A
- step: 50
- thresholds: []
- timeFrom:
- timeShift:
- title: Idle cpu
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: percent
- label: cpu usage
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - alerting: {}
- aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 9
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(node_load1)
- intervalFactor: 4
- legendFormat: load 1m
- refId: A
- step: 20
- target: ''
- - expr: sum(node_load5)
- intervalFactor: 4
- legendFormat: load 5m
- refId: B
- step: 20
- target: ''
- - expr: sum(node_load15)
- intervalFactor: 4
- legendFormat: load 15m
- refId: C
- step: 20
- target: ''
- thresholds: []
- timeFrom:
- timeShift:
- title: System load
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: percentunit
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: New row
- titleSize: h6
- - collapse: false
- height: 250px
- panels:
- - alerting: {}
- aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 4
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: node_memory_SwapFree{instance="172.17.0.1:9100",job="prometheus"}
- yaxis: 2
- spaceLength: 10
- span: 9
- stack: true
- steppedLine: false
- targets:
- - expr: sum(node_memory_MemTotal) - sum(node_memory_MemFree) - sum(node_memory_Buffers)
- - sum(node_memory_Cached)
- intervalFactor: 2
- legendFormat: memory usage
- metric: memo
- refId: A
- step: 10
- target: ''
- - expr: sum(node_memory_Buffers)
- interval: ''
- intervalFactor: 2
- legendFormat: memory buffers
- metric: memo
- refId: B
- step: 10
- target: ''
- - expr: sum(node_memory_Cached)
- interval: ''
- intervalFactor: 2
- legendFormat: memory cached
- metric: memo
- refId: C
- step: 10
- target: ''
- - expr: sum(node_memory_MemFree)
- interval: ''
- intervalFactor: 2
- legendFormat: memory free
- metric: memo
- refId: D
- step: 10
- target: ''
- thresholds: []
- timeFrom:
- timeShift:
- title: Memory usage
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 5
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: "((sum(node_memory_MemTotal) - sum(node_memory_MemFree) - sum(node_memory_Buffers)
- - sum(node_memory_Cached)) / sum(node_memory_MemTotal)) * 100"
- intervalFactor: 2
- metric: ''
- refId: A
- step: 60
- target: ''
- thresholds: 80, 90
- title: Memory usage
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: avg
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: New row
- titleSize: h6
- - collapse: false
- height: 246
- panels:
- - alerting: {}
- aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 6
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: read
- yaxis: 1
- - alias: '{instance="172.17.0.1:9100"}'
- yaxis: 2
- - alias: io time
- yaxis: 2
- spaceLength: 10
- span: 9
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(node_disk_bytes_read[5m]))
- hide: false
- intervalFactor: 4
- legendFormat: read
- refId: A
- step: 20
- target: ''
- - expr: sum(rate(node_disk_bytes_written[5m]))
- intervalFactor: 4
- legendFormat: written
- refId: B
- step: 20
- - expr: sum(rate(node_disk_io_time_ms[5m]))
- intervalFactor: 4
- legendFormat: io time
- refId: C
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Disk I/O
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: ms
- label:
- logBase: 1
- max:
- min:
- show: true
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: percentunit
- gauge:
- maxValue: 1
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 12
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: (sum(node_filesystem_size{device!="rootfs"}) - sum(node_filesystem_free{device!="rootfs"}))
- / sum(node_filesystem_size{device!="rootfs"})
- intervalFactor: 2
- refId: A
- step: 60
- target: ''
- thresholds: 0.75, 0.9
- title: Disk space usage
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: New row
- titleSize: h6
- - collapse: false
- height: 250px
- panels:
- - alerting: {}
- aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 8
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: 'transmitted '
- yaxis: 2
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(node_network_receive_bytes{device!~"lo"}[5m]))
- hide: false
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 10
- target: ''
- thresholds: []
- timeFrom:
- timeShift:
- title: Network received
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - alerting: {}
- aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 10
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: 'transmitted '
- yaxis: 2
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(node_network_transmit_bytes{device!~"lo"}[5m]))
- hide: false
- intervalFactor: 2
- legendFormat: ''
- refId: B
- step: 10
- target: ''
- thresholds: []
- timeFrom:
- timeShift:
- title: Network transmitted
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: New row
- titleSize: h6
- - collapse: false
- height: 276
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 11
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 9
- stack: false
- steppedLine: false
- targets:
- - expr: sum(kube_pod_info)
- format: time_series
- intervalFactor: 2
- legendFormat: Current number of Pods
- refId: A
- step: 10
- - expr: sum(kube_node_status_capacity_pods)
- format: time_series
- intervalFactor: 2
- legendFormat: Maximum capacity of pods
- refId: B
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Cluster Pod Utilization
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 7
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: 100 - (sum(kube_node_status_capacity_pods) - sum(kube_pod_info)) / sum(kube_node_status_capacity_pods)
- * 100
- format: time_series
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 60
- target: ''
- thresholds: '80,90'
- title: Pod Utilization
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: Dashboard Row
- titleSize: h6
- schemaVersion: 14
- style: dark
- tags: []
- templating:
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- time:
- from: now-1h
- to: now
- timepicker:
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- timezone: browser
- title: Kubernetes Capacity Planning
- version: 4
- inputs:
- - name: prometheus
- pluginId: prometheus
- type: datasource
- value: prometheus
- overwrite: true
- kubernetes_cluster_status:
- __inputs:
- - name: prometheus
- label: prometheus
- description: ''
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: grafana
- id: grafana
- name: Grafana
- version: 4.4.1
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- - type: panel
- id: singlestat
- name: Singlestat
- version: ''
- annotations:
- list: []
- editable: true
- gnetId:
- graphTooltip: 0
- hideControls: false
- id:
- links: []
- rows:
- - collapse: false
- height: 129
- panels:
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 5
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 6
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: sum(up{job=~"apiserver|kube-scheduler|kube-controller-manager"} == 0)
- format: time_series
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 600
- thresholds: '1,3'
- title: Control Plane UP
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: UP
- value: 'null'
- valueName: total
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 6
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 6
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: sum(ALERTS{alertstate="firing",alertname!="DeadMansSwitch"})
- format: time_series
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 600
- thresholds: '3,5'
- title: Alerts Firing
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: '0'
- value: 'null'
- valueName: current
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Cluster Health
- titleSize: h6
- - collapse: false
- height: 168
- panels:
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- decimals:
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 1
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: (sum(up{job="apiserver"} == 1) / count(up{job="apiserver"})) * 100
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 600
- thresholds: '50,80'
- title: API Servers UP
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- decimals:
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 2
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: (sum(up{job="kube-controller-manager-discovery"} == 1) / count(up{job="kube-controller-manager-discovery"}))
- * 100
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 600
- thresholds: '50,80'
- title: Controller Managers UP
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(245, 54, 54, 0.9)
- - rgba(237, 129, 40, 0.89)
- - rgba(50, 172, 45, 0.97)
- datasource: "${DS_PROMETHEUS}"
- decimals:
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 3
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: (sum(up{job="kube-scheduler-discovery"} == 1) / count(up{job="kube-scheduler-discovery"}))
- * 100
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 600
- thresholds: '50,80'
- title: Schedulers UP
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- decimals:
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- hideTimeOverride: false
- id: 4
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: count(increase(kube_pod_container_status_restarts{namespace=~"kube-system|tectonic-system"}[1h])
- > 5)
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 600
- thresholds: '1,3'
- title: Crashlooping Control Plane Pods
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: '0'
- value: 'null'
- valueName: current
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Control Plane Status
- titleSize: h6
- - collapse: false
- height: 158
- panels:
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 8
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: sum(100 - (avg by (instance) (rate(node_cpu{job="node-exporter",mode="idle"}[5m]))
- * 100)) / count(node_cpu{job="node-exporter",mode="idle"})
- format: time_series
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 600
- thresholds: '80,90'
- title: CPU Utilization
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: avg
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 7
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: "((sum(node_memory_MemTotal) - sum(node_memory_MemFree) - sum(node_memory_Buffers)
- - sum(node_memory_Cached)) / sum(node_memory_MemTotal)) * 100"
- format: time_series
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 600
- thresholds: '80,90'
- title: Memory Utilization
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: avg
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 9
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: (sum(node_filesystem_size{device!="rootfs"}) - sum(node_filesystem_free{device!="rootfs"}))
- / sum(node_filesystem_size{device!="rootfs"})
- format: time_series
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 600
- thresholds: '80,90'
- title: Filesystem Utilization
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: avg
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 10
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: 100 - (sum(kube_node_status_capacity_pods) - sum(kube_pod_info)) / sum(kube_node_status_capacity_pods)
- * 100
- format: time_series
- intervalFactor: 2
- legendFormat: ''
- refId: A
- step: 600
- thresholds: '80,90'
- title: Pod Utilization
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: avg
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Capacity Planing
- titleSize: h6
- schemaVersion: 14
- style: dark
- tags: []
- templating:
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- time:
- from: now-6h
- to: now
- timepicker:
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- timezone: ''
- title: Kubernetes Cluster Status
- version: 3
- inputs:
- - name: prometheus
- pluginId: prometheus
- type: datasource
- value: prometheus
- overwrite: true
- nginx_stats:
- __inputs:
- - name: prometheus
- label: prometheus
- description: ''
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: grafana
- id: grafana
- name: Grafana
- version: 4.5.2
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- annotations:
- list: []
- description: Show stats from the hnlq715/nginx-vts-exporter.
- editable: true
- gnetId: 2949
- graphTooltip: 0
- hideControls: false
- id:
- links: []
- refresh: 5m
- rows:
- - collapse: false
- height: 250
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 7
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 12
- stack: false
- steppedLine: false
- targets:
- - expr: sum(nginx_upstream_responses_total{upstream=~"^$Upstream$"}) by (status_code,
- upstream)
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{ status_code }}.{{ upstream }}"
- metric: nginx_upstream_response
- refId: A
- step: 4
- thresholds: []
- timeFrom:
- timeShift:
- title: HTTP Response Codes by Upstream
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: Dashboard Row
- titleSize: h6
- - collapse: false
- height: 250
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 6
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(irate(nginx_upstream_requests_total{upstream=~"^$Upstream$"}[5m]))
- by (upstream)
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{ upstream }}"
- metric: nginx_upstream_requests
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Upstream Requests rate
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 5
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(irate(nginx_upstream_bytes_total{upstream=~"^$Upstream$"}[5m])) by
- (direction, upstream)
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{ direction }}.{{ upstream }}"
- metric: nginx_upstream_bytes
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Upstream Bytes Transfer rate
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: Dashboard Row
- titleSize: h6
- - collapse: false
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 1
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(irate(nginx_connections_total[5m])) by (type)
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ type }}"
- metric: nginx_server_connections
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Overall Connections rate
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 4
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(irate(nginx_cache_total{ server_zone=~"$ingress"}[5m])) by (server_zone,
- type)
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{ type }}.{{ server_zone }}"
- metric: nginx_server_cache
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Cache Action rate
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: Dashboard Row
- titleSize: h6
- - collapse: false
- height: 250
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 3
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(irate(nginx_requests_total{ server_zone=~"$ingress" }[5m])) by (server_zone)
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: "{{ server_zone }}"
- metric: nginx_server_requests
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Overall Requests rate
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 2
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(irate(nginx_bytes_total{ server_zone=~"$ingress" }[5m])) by (direction,
- server_zone)
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ direction }}.{{ server_zone }}"
- metric: nginx_server_bytes
- refId: A
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Overall Bytes Transferred rate
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: Dashboard Row
- titleSize: h6
- schemaVersion: 14
- style: dark
- tags:
- - prometheus
- - nginx
- templating:
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- - allValue: ".*"
- current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 0
- includeAll: false
- label:
- multi: true
- name: Upstream
- options: []
- query: label_values(nginx_upstream_bytes_total, upstream)
- refresh: 1
- regex: ''
- sort: 1
- tagValuesQuery: ''
- tags: []
- tagsQuery: ''
- type: query
- useTags: false
- - allValue:
- current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 0
- includeAll: false
- label:
- multi: true
- name: ingress
- options: []
- query: label_values(nginx_bytes_total, server_zone)
- refresh: 1
- regex: "/^[^\\*_]+$/"
- sort: 1
- tagValuesQuery: ''
- tags: []
- tagsQuery: ''
- type: query
- useTags: false
- time:
- from: now-1h
- to: now
- timepicker:
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- timezone: browser
- title: Nginx Stats
- version: 13
- nodes:
- __inputs:
- - name: prometheus
- label: prometheus
- description: ''
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: grafana
- id: grafana
- name: Grafana
- version: 4.4.1
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- - type: panel
- id: singlestat
- name: Singlestat
- version: ''
- annotations:
- list: []
- description: Dashboard to get an overview of one server
- editable: true
- gnetId: 22
- graphTooltip: 0
- hideControls: false
- id:
- links: []
- refresh: false
- rows:
- - collapse: false
- height: 250px
- panels:
- - alerting: {}
- aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 3
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: 100 - (avg by (cpu) (irate(node_cpu{mode="idle", instance="$server"}[5m]))
- * 100)
- hide: false
- intervalFactor: 10
- legendFormat: "{{cpu}}"
- refId: A
- step: 50
- thresholds: []
- timeFrom:
- timeShift:
- title: Idle cpu
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: percent
- label: cpu usage
- logBase: 1
- max: 100
- min: 0
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - alerting: {}
- aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 9
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: node_load1{instance="$server"}
- intervalFactor: 4
- legendFormat: load 1m
- refId: A
- step: 20
- target: ''
- - expr: node_load5{instance="$server"}
- intervalFactor: 4
- legendFormat: load 5m
- refId: B
- step: 20
- target: ''
- - expr: node_load15{instance="$server"}
- intervalFactor: 4
- legendFormat: load 15m
- refId: C
- step: 20
- target: ''
- thresholds: []
- timeFrom:
- timeShift:
- title: System load
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: percentunit
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: New row
- titleSize: h6
- - collapse: false
- height: 250px
- panels:
- - alerting: {}
- aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 4
- legend:
- alignAsTable: false
- avg: false
- current: false
- hideEmpty: false
- hideZero: false
- max: false
- min: false
- rightSide: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: node_memory_SwapFree{instance="172.17.0.1:9100",job="prometheus"}
- yaxis: 2
- spaceLength: 10
- span: 9
- stack: true
- steppedLine: false
- targets:
- - expr: node_memory_MemTotal{instance="$server"} - node_memory_MemFree{instance="$server"}
- - node_memory_Buffers{instance="$server"} - node_memory_Cached{instance="$server"}
- hide: false
- interval: ''
- intervalFactor: 2
- legendFormat: memory used
- metric: ''
- refId: C
- step: 10
- - expr: node_memory_Buffers{instance="$server"}
- interval: ''
- intervalFactor: 2
- legendFormat: memory buffers
- metric: ''
- refId: E
- step: 10
- - expr: node_memory_Cached{instance="$server"}
- intervalFactor: 2
- legendFormat: memory cached
- metric: ''
- refId: F
- step: 10
- - expr: node_memory_MemFree{instance="$server"}
- intervalFactor: 2
- legendFormat: memory free
- metric: ''
- refId: D
- step: 10
- thresholds: []
- timeFrom:
- timeShift:
- title: Memory usage
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: percent
- gauge:
- maxValue: 100
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 5
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: ((node_memory_MemTotal{instance="$server"} - node_memory_MemFree{instance="$server"} -
- node_memory_Buffers{instance="$server"} - node_memory_Cached{instance="$server"})
- / node_memory_MemTotal{instance="$server"}) * 100
- intervalFactor: 2
- refId: A
- step: 60
- target: ''
- thresholds: 80, 90
- title: Memory usage
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: avg
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: New row
- titleSize: h6
- - collapse: false
- height: 250px
- panels:
- - alerting: {}
- aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 6
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: read
- yaxis: 1
- - alias: '{instance="172.17.0.1:9100"}'
- yaxis: 2
- - alias: io time
- yaxis: 2
- spaceLength: 10
- span: 9
- stack: false
- steppedLine: false
- targets:
- - expr: sum by (instance) (rate(node_disk_bytes_read{instance="$server"}[2m]))
- hide: false
- intervalFactor: 4
- legendFormat: read
- refId: A
- step: 20
- target: ''
- - expr: sum by (instance) (rate(node_disk_bytes_written{instance="$server"}[2m]))
- intervalFactor: 4
- legendFormat: written
- refId: B
- step: 20
- - expr: sum by (instance) (rate(node_disk_io_time_ms{instance="$server"}[2m]))
- intervalFactor: 4
- legendFormat: io time
- refId: C
- step: 20
- thresholds: []
- timeFrom:
- timeShift:
- title: Disk I/O
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: ms
- label:
- logBase: 1
- max:
- min:
- show: true
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: percentunit
- gauge:
- maxValue: 1
- minValue: 0
- show: true
- thresholdLabels: false
- thresholdMarkers: true
- id: 7
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: (sum(node_filesystem_size{device!="rootfs",instance="$server"}) - sum(node_filesystem_free{device!="rootfs",instance="$server"}))
- / sum(node_filesystem_size{device!="rootfs",instance="$server"})
- intervalFactor: 2
- refId: A
- step: 60
- target: ''
- thresholds: 0.75, 0.9
- title: Disk space usage
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: New row
- titleSize: h6
- - collapse: false
- height: 250px
- panels:
- - alerting: {}
- aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 8
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: 'transmitted '
- yaxis: 2
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: rate(node_network_receive_bytes{instance="$server",device!~"lo"}[5m])
- hide: false
- intervalFactor: 2
- legendFormat: "{{device}}"
- refId: A
- step: 10
- target: ''
- thresholds: []
- timeFrom:
- timeShift:
- title: Network received
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - alerting: {}
- aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 10
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: 'transmitted '
- yaxis: 2
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: rate(node_network_transmit_bytes{instance="$server",device!~"lo"}[5m])
- hide: false
- intervalFactor: 2
- legendFormat: "{{device}}"
- refId: B
- step: 10
- target: ''
- thresholds: []
- timeFrom:
- timeShift:
- title: Network transmitted
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: bytes
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: New row
- titleSize: h6
- schemaVersion: 14
- style: dark
- tags: []
- templating:
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- - allValue:
- current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 0
- includeAll: false
- label: Server
- multi: false
- name: host
- options: []
- query: label_values(node_uname_info, nodename)
- refresh: 1
- regex: ''
- sort: 0
- tagValuesQuery: ''
- tags: []
- tagsQuery: ''
- type: query
- useTags: false
- - allValue:
- current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 2
- includeAll: false
- label: Instance
- multi: false
- name: server
- options: []
- query: label_values(node_uname_info{nodename="$host"}, instance)
- refresh: 1
- regex: ''
- sort: 0
- tagValuesQuery: ''
- tags: []
- tagsQuery: ''
- type: query
- useTags: false
- time:
- from: now-1h
- to: now
- timepicker:
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- timezone: browser
- title: Nodes
- version: 2
- inputs:
- - name: prometheus
- pluginId: prometheus
- type: datasource
- value: prometheus
- overwrite: true
- rabbitmq:
- __inputs:
- - name: DS_PROMETHEUS
- label: Prometheus
- description: ''
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: grafana
- id: grafana
- name: Grafana
- version: 4.2.0
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- - type: panel
- id: singlestat
- name: Singlestat
- version: ''
- annotations:
- list: []
- editable: true
- gnetId: 2121
- graphTooltip: 0
- hideControls: false
- id:
- links: []
- refresh: 5m
- rows:
- - collapse: false
- height: 266
- panels:
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(50, 172, 45, 0.97)
- - rgba(237, 129, 40, 0.89)
- - rgba(245, 54, 54, 0.9)
- datasource: "${DS_PROMETHEUS}"
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 13
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 3
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- targets:
- - expr: rabbitmq_up{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- metric: rabbitmq_up{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- refId: A
- step: 2
- thresholds: Up,Down
- timeFrom: 30s
- title: RabbitMQ Server
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- - op: "="
- text: Down
- value: '0'
- - op: "="
- text: Up
- value: '1'
- valueName: current
- - alert:
- conditions:
- - evaluator:
- params:
- - 1
- type: lt
- operator:
- type: and
- query:
- params:
- - A
- - 10s
- - now
- reducer:
- params: []
- type: last
- type: query
- - evaluator:
- params: []
- type: no_value
- operator:
- type: and
- query:
- params:
- - A
- - 10s
- - now
- reducer:
- params: []
- type: last
- type: query
- executionErrorState: alerting
- frequency: 60s
- handler: 1
- message: Some of the RabbitMQ node is down
- name: Node Stats alert
- noDataState: no_data
- notifications: []
- aliasColors: {}
- bars: true
- datasource: "${DS_PROMETHEUS}"
- decimals: 0
- fill: 1
- id: 12
- legend:
- alignAsTable: true
- avg: false
- current: true
- max: false
- min: false
- show: true
- total: false
- values: true
- lines: false
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 9
- stack: false
- steppedLine: false
- targets:
- - expr: rabbitmq_running{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{node}}"
- metric: rabbitmq_running
- refId: A
- step: 2
- thresholds:
- - colorMode: critical
- fill: true
- line: true
- op: lt
- value: 1
- timeFrom: 30s
- timeShift:
- title: Node up Stats
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 0
- fill: 1
- id: 6
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: rabbitmq_exchangesTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{instance}}:exchanges"
- metric: rabbitmq_exchangesTotal
- refId: A
- step: 2
- thresholds: []
- timeFrom:
- timeShift:
- title: Exchanges
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 0
- fill: 1
- id: 4
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: rabbitmq_channelsTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{instance}}:channels"
- metric: rabbitmq_channelsTotal
- refId: A
- step: 2
- thresholds: []
- timeFrom:
- timeShift:
- title: Channels
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 0
- fill: 1
- id: 3
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: rabbitmq_consumersTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{instance}}:consumers"
- metric: rabbitmq_consumersTotal
- refId: A
- step: 2
- thresholds: []
- timeFrom:
- timeShift:
- title: Consumers
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 0
- fill: 1
- id: 5
- legend:
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: rabbitmq_connectionsTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{instance}}:connections"
- metric: rabbitmq_connectionsTotal
- refId: A
- step: 2
- thresholds: []
- timeFrom:
- timeShift:
- title: Connections
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 7
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: rabbitmq_queuesTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{instance}}:queues"
- metric: rabbitmq_queuesTotal
- refId: A
- step: 2
- thresholds: []
- timeFrom:
- timeShift:
- title: Queues
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 0
- fill: 1
- id: 8
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum by (vhost)(rabbitmq_queue_messages_ready{application="prometheus_rabbitmq_exporter",release_group="$rabbit"})
- intervalFactor: 2
- legendFormat: "{{vhost}}:ready"
- metric: rabbitmq_queue_messages_ready
- refId: A
- step: 2
- - expr: sum by (vhost)(rabbitmq_queue_messages_published_total{application="prometheus_rabbitmq_exporter",release_group="$rabbit"})
- intervalFactor: 2
- legendFormat: "{{vhost}}:published"
- metric: rabbitmq_queue_messages_published_total
- refId: B
- step: 2
- - expr: sum by (vhost)(rabbitmq_queue_messages_delivered_total{application="prometheus_rabbitmq_exporter",release_group="$rabbit"})
- intervalFactor: 2
- legendFormat: "{{vhost}}:delivered"
- metric: rabbitmq_queue_messages_delivered_total
- refId: C
- step: 2
- - expr: sum by (vhost)(rabbitmq_queue_messages_unacknowledged{application="prometheus_rabbitmq_exporter",release_group="$rabbit"})
- intervalFactor: 2
- legendFormat: "{{vhost}}:unack"
- metric: ack
- refId: D
- step: 2
- thresholds: []
- timeFrom:
- timeShift:
- title: Messages/host
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 0
- fill: 1
- id: 2
- legend:
- alignAsTable: true
- avg: false
- current: true
- max: false
- min: false
- rightSide: false
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: rabbitmq_queue_messages{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{queue}}:{{durable}}"
- metric: rabbitmq_queue_messages
- refId: A
- step: 2
- thresholds: []
- timeFrom:
- timeShift:
- title: Messages / Queue
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 9
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: rabbitmq_node_mem_used{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{node}}:used"
- metric: rabbitmq_node_mem_used
- refId: A
- step: 2
- - expr: rabbitmq_node_mem_limit{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{node}}:limit"
- metric: node_mem
- refId: B
- step: 2
- thresholds: []
- timeFrom:
- timeShift:
- title: Memory
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: decbytes
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 10
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: rabbitmq_fd_used{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{node}}:used"
- metric: ''
- refId: A
- step: 2
- - expr: rabbitmq_fd_total{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{node}}:total"
- metric: node_mem
- refId: B
- step: 2
- thresholds: []
- timeFrom:
- timeShift:
- title: FIle descriptors
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 11
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: rabbitmq_sockets_used{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{node}}:used"
- metric: ''
- refId: A
- step: 2
- - expr: rabbitmq_sockets_total{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}
- intervalFactor: 2
- legendFormat: "{{node}}:total"
- metric: ''
- refId: B
- step: 2
- thresholds: []
- timeFrom:
- timeShift:
- title: Sockets
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- transparent: false
- type: graph
- xaxis:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: Dashboard Row
- titleSize: h6
- schemaVersion: 14
- style: dark
- tags: []
- templating:
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- - current: {}
- hide: 0
- label: null
- name: rabbit
- options: []
- type: query
- query: label_values(rabbitmq_up, release_group)
- refresh: 1
- sort: 1
- datasource: "${DS_PROMETHEUS}"
- time:
- from: now-5m
- to: now
- timepicker:
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- timezone: browser
- title: RabbitMQ Metrics
- version: 17
- description: 'Basic rabbitmq host stats: Node Stats, Exchanges, Channels, Consumers, Connections,
- Queues, Messages, Messages per Queue, Memory, File Descriptors, Sockets.'
- openstack_control_plane:
- __inputs:
- - name: prometheus
- label: prometheus
- description: ''
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: grafana
- id: grafana
- name: Grafana
- version: 4.5.2
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- - type: panel
- id: singlestat
- name: Singlestat
- version: ''
- - type: panel
- id: text
- name: Text
- version: ''
- annotations:
- list: []
- editable: true
- gnetId:
- graphTooltip: 1
- hideControls: false
- id:
- links: []
- refresh: 5m
- rows:
- - collapse: false
- height: 250px
- panels:
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(200, 54, 35, 0.88)
- - rgba(118, 245, 40, 0.73)
- - rgba(225, 177, 40, 0.59)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 24
- interval: "> 60s"
- links:
- - dashboard: Openstack Service
- name: Drilldown dashboard
- params: var-Service=keystone
- title: Openstack Service
- type: dashboard
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: openstack_check_keystone_api{job="openstack-metrics", region="$region"}
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '1,2'
- title: Keystone
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: no data
- value: 'null'
- - op: "="
- text: CRIT
- value: '0'
- - op: "="
- text: OK
- value: '1'
- - op: "="
- text: UNKW
- value: '2'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(200, 54, 35, 0.88)
- - rgba(118, 245, 40, 0.73)
- - rgba(225, 177, 40, 0.59)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 23
- interval: "> 60s"
- links:
- - dashboard: Openstack Service
- name: Drilldown dashboard
- params: var-Service=glance
- title: Openstack Service
- type: dashboard
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: openstack_check_glance_api{job="openstack-metrics", region="$region"}
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '1,2'
- title: Glance
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: no data
- value: 'null'
- - op: "="
- text: CRIT
- value: '0'
- - op: "="
- text: OK
- value: '1'
- - op: "="
- text: UNKW
- value: '2'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(202, 58, 40, 0.86)
- - rgba(118, 245, 40, 0.73)
- - rgba(225, 177, 40, 0.59)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 22
- interval: "> 60s"
- links:
- - dashboard: Openstack Service
- name: Drilldown dashboard
- params: var-Service=heat
- title: Openstack Service
- type: dashboard
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: openstack_check_heat_api{job="openstack-metrics", region="$region"}
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '1,2'
- title: Heat
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: no data
- value: 'null'
- - op: "="
- text: CRIT
- value: '0'
- - op: "="
- text: OK
- value: '1'
- - op: "="
- text: UNKW
- value: '2'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(200, 54, 35, 0.88)
- - rgba(118, 245, 40, 0.73)
- - rgba(225, 177, 40, 0.59)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 21
- interval: "> 60s"
- links:
- - dashboard: Openstack Service
- name: Drilldown dashboard
- params: var-Service=neutron
- title: Openstack Service
- type: dashboard
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: openstack_check_neutron_api{job="openstack-metrics", region="$region"}
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '1,2'
- title: Neutron
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: no data
- value: 'null'
- - op: "="
- text: CRIT
- value: '0'
- - op: "="
- text: OK
- value: '1'
- - op: "="
- text: UNKW
- value: '2'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(208, 53, 34, 0.82)
- - rgba(118, 245, 40, 0.73)
- - rgba(225, 177, 40, 0.59)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 20
- interval: "> 60s"
- links:
- - dashboard: Openstack Service
- name: Drilldown dashboard
- params: var-Service=nova
- title: Openstack Service
- type: dashboard
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: openstack_check_nova_api{job="openstack-metrics", region="$region"}
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '1,2'
- title: Nova
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: no data
- value: 'null'
- - op: "="
- text: CRIT
- value: '0'
- - op: "="
- text: OK
- value: '1'
- - op: "="
- text: UNKW
- value: '2'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(200, 54, 35, 0.88)
- - rgba(118, 245, 40, 0.73)
- - rgba(225, 177, 40, 0.59)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 19
- interval: "> 60s"
- links:
- - dashboard: Openstack Service
- name: Drilldown dashboard
- params: var-Service=swift
- title: Openstack Service
- type: dashboard
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: openstack_check_swift_api{job="openstack-metrics", region="$region"}
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '1,2'
- title: Ceph
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: no data
- value: 'null'
- - op: "="
- text: CRIT
- value: '0'
- - op: "="
- text: OK
- value: '1'
- - op: "="
- text: UNKW
- value: '2'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(200, 54, 35, 0.88)
- - rgba(118, 245, 40, 0.73)
- - rgba(225, 177, 40, 0.59)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 18
- interval: "> 60s"
- links:
- - dashboard: Openstack Service
- name: Drilldown dashboard
- params: var-Service=cinder
- title: Openstack Service
- type: dashboard
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: openstack_check_cinder_api{job="openstack-metrics", region="$region"}
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '1,2'
- title: Cinder
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: no data
- value: 'null'
- - op: "="
- text: CRIT
- value: '0'
- - op: "="
- text: OK
- value: '1'
- - op: "="
- text: UNKW
- value: '2'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(200, 54, 35, 0.88)
- - rgba(118, 245, 40, 0.73)
- - rgba(225, 177, 40, 0.59)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 17
- interval: "> 60s"
- links:
- - dashboard: Openstack Service
- name: Drilldown dashboard
- params: var-Service=placement
- title: Openstack Service
- type: dashboard
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: openstack_check_placement_api{job="openstack-metrics", region="$region"}
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '1,2'
- title: Placement
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: no data
- value: 'null'
- - op: "="
- text: CRIT
- value: '0'
- - op: "="
- text: OK
- value: '1'
- - op: "="
- text: UNKW
- value: '2'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(208, 53, 34, 0.82)
- - rgba(118, 245, 40, 0.73)
- - rgba(225, 177, 40, 0.59)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 16
- interval: "> 60s"
- links:
- - dashboard: RabbitMQ Metrics
- name: Drilldown dashboard
- title: RabbitMQ Metrics
- type: dashboard
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: min(rabbitmq_up)
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '1,2'
- title: RabbitMQ
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: no data
- value: 'null'
- - op: "="
- text: CRIT
- value: '0'
- - op: "="
- text: OK
- value: '1'
- - op: "="
- text: UNKW
- value: '2'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(208, 53, 34, 0.82)
- - rgba(118, 245, 40, 0.73)
- - rgba(225, 177, 40, 0.59)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 15
- interval: "> 60s"
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: min(mysql_global_status_wsrep_ready)
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '1,2'
- title: MariaDB
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: no data
- value: 'null'
- - op: "="
- text: CRIT
- value: '0'
- - op: "="
- text: OK
- value: '1'
- - op: "="
- text: UNKW
- value: '2'
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(225, 177, 40, 0.59)
- - rgba(208, 53, 34, 0.82)
- - rgba(118, 245, 40, 0.73)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 14
- interval: "> 60s"
- links:
- - dashboard: Nginx Stats
- name: Drilldown dashboard
- title: Nginx Stats
- type: dashboard
- mappingType: 2
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: '1'
- text: OK
- to: '99999999999999'
- - from: '0'
- text: CRIT
- to: '0'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: sum_over_time(nginx_connections_total{type="active", namespace="openstack"}[5m])
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '0,1'
- title: Nginx
- type: singlestat
- valueFontSize: 50%
- valueName: current
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(208, 53, 34, 0.82)
- - rgba(118, 245, 40, 0.73)
- - rgba(225, 177, 40, 0.59)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 13
- interval: "> 60s"
- links:
- - dashboard: Memcached
- name: Drilldown dashboard
- title: Memcached
- type: dashboard
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: min(memcached_up)
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '1,2'
- title: Memcached
- type: singlestat
- valueFontSize: 50%
- valueMaps:
- - op: "="
- text: no data
- value: 'null'
- - op: "="
- text: CRIT
- value: '0'
- - op: "="
- text: OK
- value: '1'
- - op: "="
- text: UNKW
- value: '2'
- valueName: current
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: OpenStack Services
- titleSize: h6
- - collapse: false
- height: 250px
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 11
- interval: "> 60s"
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 3
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - alias: free
- column: value
- expr: openstack_total_used_vcpus{job="openstack-metrics", region="$region"} + openstack_total_free_vcpus{job="openstack-metrics",
- region="$region"}
- format: time_series
- function: min
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - '0'
- type: fill
- groupByTags: []
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- - alias: used
- column: value
- expr: openstack_total_used_vcpus{job="openstack-metrics", region="$region"}
- format: time_series
- function: max
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - '0'
- type: fill
- groupByTags: []
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: B
- resultFormat: time_series
- step: 120
- thresholds: []
- timeFrom:
- timeShift:
- title: VCPUs (total vs used)
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 12
- interval: "> 60s"
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 3
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - alias: free
- column: value
- expr: openstack_total_used_ram_MB{job="openstack-metrics", region="$region"} + openstack_total_free_ram_MB{job="openstack-metrics",
- region="$region"}
- format: time_series
- function: mean
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - '0'
- type: fill
- groupByTags: []
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- - alias: used
- column: value
- expr: openstack_total_used_ram_MB{job="openstack-metrics", region="$region"}
- format: time_series
- function: mean
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - '0'
- type: fill
- groupByTags: []
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: B
- resultFormat: time_series
- step: 120
- thresholds: []
- timeFrom:
- timeShift:
- title: RAM (total vs used)
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: mbytes
- label: ''
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 13
- interval: "> 60s"
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 3
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - alias: free
- column: value
- expr: openstack_total_used_disk_GB{job="openstack-metrics", region="$region"} + openstack_total_free_disk_GB{job="openstack-metrics",
- region="$region"}
- format: time_series
- function: mean
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - '0'
- type: fill
- groupByTags: []
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- - alias: used
- column: value
- expr: openstack_total_used_disk_GB{job="openstack-metrics", region="$region"}
- format: time_series
- function: mean
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - '0'
- type: fill
- groupByTags: []
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: B
- resultFormat: time_series
- step: 120
- thresholds: []
- timeFrom:
- timeShift:
- title: Disk (used vs total)
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: gbytes
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes": false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 27
- interval: "> 60s"
- legend:
- alignAsTable: false
- avg: true
- current: true
- hideEmpty: true
- hideZero: false
- max: true
- min: true
- show: true
- total: false
- values: true
- lines: true
- linewidth: 4
- links: []
- nullPointMode: null
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- stack: false
- steppedLine: false
- targets:
- - alias: free
- column: value
- expr: sum(openstack_running_instances)
- format: time_series
- function: mean
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - '0'
- type: fill
- groupByTags: []
- interval: "15s"
- intervalFactor: 1
- legendFormat: "{{ running_vms }}"
- policy: default
- rawQuery: false
- refID: A
- resultFormat: time_series
- - alias: used
- column: value
- expr: sum(openstack_total_running_instances)
- format: time_series
- function: mean
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - '0'
- type: fill
- groupByTags: []
- interval: "15s"
- intervalFactor: 1
- legendFormat: "{{ total_vms }}"
- policy: default
- rawQuery: false
- refID: B
- resultFormat: time_series
- step: 120
- thresholds: []
- timeFrom:
- timeShift:
- title: OpenStack Instances
- tooltip:
- msResolution: false
- shared: true
- sort : 0
- value_type: cumulative
- transparent: true
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: none
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: false
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Virtual resources
- titleSize: h6
- schemaVersion: 14
- style: dark
- tags: []
- templating:
- enable: true
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- - allValue:
- current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 0
- includeAll: false
- label:
- multi: false
- name: region
- options: []
- query: label_values(openstack_exporter_cache_refresh_duration_seconds, region)
- refresh: 1
- regex: ''
- sort: 0
- tagValuesQuery: ''
- tags: []
- tagsQuery: ''
- type: query
- useTags: false
- time:
- from: now-1h
- to: now
- timepicker:
- collapse: false
- enable: true
- notice: false
- now: true
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- status: Stable
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- type: timepicker
- timezone: browser
- title: OpenStack Metrics
- version: 2
- openstack-service:
- __inputs:
- - name: prometheus
- label: prometheus
- description: ''
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: grafana
- id: grafana
- name: Grafana
- version: 4.5.2
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- - type: panel
- id: singlestat
- name: Singlestat
- version: ''
- annotations:
- enable: true
- list: []
- editable: true
- gnetId:
- graphTooltip: 1
- hideControls: false
- id:
- links: []
- refresh: 5m
- rows:
- - collapse: false
- height: 250px
- panels:
- - cacheTimeout:
- colorBackground: true
- colorValue: false
- colors:
- - rgba(225, 177, 40, 0.59)
- - rgba(200, 54, 35, 0.88)
- - rgba(118, 245, 40, 0.73)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 6
- interval: "> 60s"
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: openstack_check_[[Service]]_api{job="openstack-metrics",region="$region"}
- fill: ''
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - 'null'
- type: fill
- groupByTags: []
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- thresholds: '0,1'
- title: ''
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: CRITICAL
- value: '0'
- - op: "="
- text: OK
- value: '1'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - rgba(200, 54, 35, 0.88)
- - rgba(118, 245, 40, 0.73)
- - rgba(225, 177, 40, 0.59)
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 13
- interval: "> 60s"
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: true
- tableColumn: ''
- targets:
- - column: value
- condition: ''
- expr: sum(nginx_responses_total{server_zone=~"[[Service]].*", status_code="5xx",region="$region"})
- fill: ''
- format: time_series
- function: count
- groupBy:
- - interval: auto
- params:
- - auto
- type: time
- - params:
- - '0'
- type: fill
- groupby_field: ''
- interval: ''
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- step: 120
- tags: []
- thresholds: ''
- title: HTTP 5xx errors
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: '0'
- value: 'null'
- valueName: current
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 0
- grid: {}
- id: 7
- interval: ">60s"
- legend:
- alignAsTable: true
- avg: true
- current: false
- max: true
- min: true
- show: true
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 8
- stack: false
- steppedLine: false
- targets:
- - expr: sum(nginx_upstream_response_msecs_avg{upstream=~"openstack-[[Service]].*",region="$region"})
- by (upstream)
- format: time_series
- intervalFactor: 2
- refId: A
- step: 120
- thresholds: []
- timeFrom:
- timeShift:
- title: HTTP response time
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: s
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- logBase: 1
- max:
- min: 0
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 9
- interval: "> 60s"
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: true
- targets:
- - alias: healthy
- column: value
- expr: openstack_check_[[Service]]_api{region="$region"}
- format: time_series
- function: last
- groupBy:
- - params:
- - "$interval"
- type: time
- - params:
- - '0'
- type: fill
- groupByTags: []
- intervalFactor: 2
- policy: default
- rawQuery: false
- refId: A
- resultFormat: time_series
- select: []
- step: 120
- tags: []
- thresholds: []
- timeFrom:
- timeShift:
- title: API Availability
- tooltip:
- msResolution: false
- shared: false
- sort: 0
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: none
- label: ''
- logBase: 1
- max: 1
- min: 0
- show: false
- - format: short
- logBase: 1
- max:
- min:
- show: false
- - aliasColors:
- '{status_code="2xx"}': "#629E51"
- '{status_code="5xx"}': "#BF1B00"
- bars: true
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 0
- grid: {}
- id: 8
- interval: "> 60s"
- legend:
- alignAsTable: false
- avg: false
- current: false
- hideEmpty: false
- max: false
- min: false
- rightSide: false
- show: true
- total: false
- values: false
- lines: false
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 8
- stack: true
- steppedLine: false
- targets:
- - expr: sum(nginx_responses_total{server_zone=~"[[Service]].*",region="$region"}) by (status_code)
- format: time_series
- intervalFactor: 2
- refId: A
- step: 120
- thresholds: []
- timeFrom:
- timeShift:
- title: Number of HTTP responses
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- logBase: 1
- max:
- min: 0
- show: true
- - format: short
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Service Status
- titleSize: h6
- schemaVersion: 14
- style: dark
- tags: []
- templating:
- enable: true
- list:
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- - allValue:
- current: {}
- datasource: prometheus
- hide: 0
- includeAll: false
- label: region
- multi: false
- name: region
- options: []
- query: label_values(openstack_exporter_cache_refresh_duration_seconds, region)
- refresh: 1
- regex: ''
- sort: 0
- tagValuesQuery: ''
- tags: []
- tagsQuery: ''
- type: query
- useTags: false
- - allValue:
- current:
- tags: []
- text: cinder
- value: cinder
- hide: 0
- includeAll: false
- label:
- multi: false
- name: Service
- options:
- - selected: false
- text: nova
- value: nova
- - selected: false
- text: glance
- value: glance
- - selected: false
- text: keystone
- value: keystone
- - selected: true
- text: cinder
- value: cinder
- - selected: false
- text: heat
- value: heat
- - selected: false
- text: placement
- value: placement
- - selected: false
- text: neutron
- value: neutron
- query: nova,glance,keystone,cinder,heat,placement,neutron
- type: custom
- time:
- from: now-1h
- to: now
- timepicker:
- collapse: false
- enable: true
- notice: false
- now: true
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- status: Stable
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- type: timepicker
- timezone: browser
- title: Openstack Service
- version: 4
- prometheus:
- __inputs:
- - name: DS_PROMETHEUS
- label: Prometheus
- description: Prometheus which you want to monitor
- type: datasource
- pluginId: prometheus
- pluginName: Prometheus
- __requires:
- - type: grafana
- id: grafana
- name: Grafana
- version: 4.6.0
- - type: panel
- id: graph
- name: Graph
- version: ''
- - type: datasource
- id: prometheus
- name: Prometheus
- version: 1.0.0
- - type: panel
- id: singlestat
- name: Singlestat
- version: ''
- - type: panel
- id: text
- name: Text
- version: ''
- annotations:
- list:
- - builtIn: 1
- datasource: "-- Grafana --"
- enable: true
- hide: true
- iconColor: rgba(0, 211, 255, 1)
- name: Annotations & Alerts
- type: dashboard
- - datasource: "${DS_PROMETHEUS}"
- enable: true
- expr: count(sum(up{instance="$instance"}) by (instance) < 1)
- hide: false
- iconColor: rgb(250, 44, 18)
- limit: 100
- name: downage
- showIn: 0
- step: 30s
- tagKeys: instance
- textFormat: prometheus down
- titleFormat: Downage
- type: alert
- - datasource: "${DS_PROMETHEUS}"
- enable: true
- expr: sum(changes(prometheus_config_last_reload_success_timestamp_seconds[10m]))
- by (instance)
- hide: false
- iconColor: "#fceaca"
- limit: 100
- name: Reload
- showIn: 0
- step: 5m
- tagKeys: instance
- tags: []
- titleFormat: Reload
- type: tags
- description: Dashboard for monitoring of Prometheus v2.x.x
- editable: true
- gnetId: 3681
- graphTooltip: 1
- hideControls: false
- id:
- links:
- - icon: info
- tags: []
- targetBlank: true
- title: 'Dashboard''s Github '
- tooltip: Github repo of this dashboard
- type: link
- url: https://github.com/FUSAKLA/Prometheus2-grafana-dashboard
- - icon: doc
- tags: []
- targetBlank: true
- title: Prometheus Docs
- tooltip: ''
- type: link
- url: http://prometheus.io/docs/introduction/overview/
- refresh: 5m
- rows:
- - collapse: false
- height: 161
- panels:
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - "#299c46"
- - rgba(237, 129, 40, 0.89)
- - "#bf1b00"
- datasource: "${DS_PROMETHEUS}"
- decimals: 1
- format: s
- gauge:
- maxValue: 1000000
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 41
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: time() - process_start_time_seconds{instance="$instance"}
- format: time_series
- instant: false
- intervalFactor: 2
- refId: A
- thresholds: ''
- title: Uptime
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - "#299c46"
- - rgba(237, 129, 40, 0.89)
- - "#bf1b00"
- datasource: "${DS_PROMETHEUS}"
- format: short
- gauge:
- maxValue: 1000000
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 42
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 4
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: true
- tableColumn: ''
- targets:
- - expr: prometheus_tsdb_head_series{instance="$instance"}
- format: time_series
- instant: false
- intervalFactor: 2
- refId: A
- thresholds: '500000,800000,1000000'
- title: Total count of time series
- type: singlestat
- valueFontSize: 150%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - "#299c46"
- - rgba(237, 129, 40, 0.89)
- - "#d44a3a"
- datasource: "${DS_PROMETHEUS}"
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 48
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: version
- targets:
- - expr: prometheus_build_info{instance="$instance"}
- format: table
- instant: true
- intervalFactor: 2
- refId: A
- thresholds: ''
- title: Version
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: avg
- - cacheTimeout:
- colorBackground: false
- colorValue: false
- colors:
- - "#299c46"
- - rgba(237, 129, 40, 0.89)
- - "#d44a3a"
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- format: ms
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 49
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 2
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: prometheus_tsdb_head_max_time{instance="$instance"} - prometheus_tsdb_head_min_time{instance="$instance"}
- format: time_series
- instant: true
- intervalFactor: 2
- refId: A
- thresholds: ''
- title: Actual head block length
- type: singlestat
- valueFontSize: 80%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: current
- - content:
- height: ''
- id: 50
- links: []
- mode: html
- span: 1
- title: ''
- transparent: true
- type: text
- - cacheTimeout:
- colorBackground: false
- colorValue: true
- colors:
- - "#e6522c"
- - rgba(237, 129, 40, 0.89)
- - "#299c46"
- datasource: "${DS_PROMETHEUS}"
- decimals: 1
- format: none
- gauge:
- maxValue: 100
- minValue: 0
- show: false
- thresholdLabels: false
- thresholdMarkers: true
- id: 52
- interval:
- links: []
- mappingType: 1
- mappingTypes:
- - name: value to text
- value: 1
- - name: range to text
- value: 2
- maxDataPoints: 100
- nullPointMode: connected
- nullText:
- postfix: ''
- postfixFontSize: 50%
- prefix: ''
- prefixFontSize: 50%
- rangeMaps:
- - from: 'null'
- text: N/A
- to: 'null'
- span: 1
- sparkline:
- fillColor: rgba(31, 118, 189, 0.18)
- full: false
- lineColor: rgb(31, 120, 193)
- show: false
- tableColumn: ''
- targets:
- - expr: '2'
- format: time_series
- intervalFactor: 2
- refId: A
- thresholds: '10,20'
- title: ''
- transparent: true
- type: singlestat
- valueFontSize: 200%
- valueMaps:
- - op: "="
- text: N/A
- value: 'null'
- valueName: avg
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: Header instance info
- titleSize: h6
- - collapse: false
- height: '250'
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 15
- legend:
- avg: true
- current: false
- max: false
- min: false
- show: false
- total: false
- values: true
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: true
- steppedLine: false
- targets:
- - expr: max(prometheus_engine_query_duration_seconds{instance="$instance"}) by
- (instance, slice)
- format: time_series
- intervalFactor: 1
- legendFormat: max duration for {{slice}}
- metric: prometheus_local_storage_rushed_mode
- refId: A
- step: 900
- thresholds: []
- timeFrom:
- timeShift:
- title: Query elapsed time
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: s
- label: ''
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 17
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: sum(increase(prometheus_tsdb_head_series_created_total{instance="$instance"}[$aggregation_interval]))
- by (instance)
- format: time_series
- intervalFactor: 2
- legendFormat: created on {{ instance }}
- metric: prometheus_local_storage_maintain_series_duration_seconds_count
- refId: A
- step: 1800
- - expr: sum(increase(prometheus_tsdb_head_series_removed_total{instance="$instance"}[$aggregation_interval]))
- by (instance) * -1
- format: time_series
- intervalFactor: 2
- legendFormat: removed on {{ instance }}
- refId: B
- thresholds: []
- timeFrom:
- timeShift:
- title: Head series created/deleted
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 13
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: sum(increase(prometheus_target_scrapes_exceeded_sample_limit_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: exceeded_sample_limit on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: A
- step: 1800
- - expr: sum(increase(prometheus_target_scrapes_sample_duplicate_timestamp_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: duplicate_timestamp on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: B
- step: 1800
- - expr: sum(increase(prometheus_target_scrapes_sample_out_of_bounds_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: out_of_bounds on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: C
- step: 1800
- - expr: sum(increase(prometheus_target_scrapes_sample_out_of_order_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: out_of_order on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: D
- step: 1800
- - expr: sum(increase(prometheus_rule_evaluation_failures_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: rule_evaluation_failure on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: G
- step: 1800
- - expr: sum(increase(prometheus_tsdb_compactions_failed_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: tsdb_compactions_failed on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: K
- step: 1800
- - expr: sum(increase(prometheus_tsdb_reloads_failures_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: tsdb_reloads_failures on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: L
- step: 1800
- - expr: sum(increase(prometheus_tsdb_head_series_not_found{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: head_series_not_found on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: N
- step: 1800
- - expr: sum(increase(prometheus_evaluator_iterations_missed_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: evaluator_iterations_missed on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: O
- step: 1800
- - expr: sum(increase(prometheus_evaluator_iterations_skipped_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: evaluator_iterations_skipped on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: P
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Prometheus errors
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: false
- title: Main info
- titleSize: h6
- - collapse: false
- height: 250
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- description: ''
- editable: true
- error: false
- fill: 1
- grid: {}
- id: 25
- legend:
- alignAsTable: true
- avg: true
- current: true
- max: true
- min: false
- show: false
- sort: max
- sortDesc: true
- total: false
- values: true
- lines: true
- linewidth: 2
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: prometheus_target_interval_length_seconds{instance="$instance",quantile="0.99"}
- - 60
- format: time_series
- interval: 2m
- intervalFactor: 1
- legendFormat: "{{instance}}"
- metric: ''
- refId: A
- step: 300
- thresholds: []
- timeFrom:
- timeShift:
- title: Scrape delay (counts with 1m scrape interval)
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: cumulative
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: s
- logBase: 1
- max:
- min:
- show: true
- - format: short
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 14
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: Queue length
- yaxis: 2
- spaceLength: 10
- span: 6
- stack: false
- steppedLine: false
- targets:
- - expr: sum(prometheus_evaluator_duration_seconds{instance="$instance"}) by (instance,
- quantile)
- format: time_series
- intervalFactor: 2
- legendFormat: Queue length
- metric: prometheus_local_storage_indexing_queue_length
- refId: B
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Rule evaulation duration
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: s
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Scrape & rule duration
- titleSize: h6
- - collapse: false
- height: 250
- panels:
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 18
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: sum(increase(http_requests_total{instance="$instance"}[$aggregation_interval]))
- by (instance, handler) > 0
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ handler }} on {{ instance }}"
- metric: ''
- refId: A
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Request count
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: none
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 16
- legend:
- avg: false
- current: false
- hideEmpty: true
- hideZero: true
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: max(sum(http_request_duration_microseconds{instance="$instance"}) by (instance,
- handler, quantile)) by (instance, handler) > 0
- format: time_series
- hide: false
- intervalFactor: 2
- legendFormat: "{{ handler }} on {{ instance }}"
- refId: B
- thresholds: []
- timeFrom:
- timeShift:
- title: Request duration per handler
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: µs
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 19
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: sum(increase(http_request_size_bytes{instance="$instance", quantile="0.99"}[$aggregation_interval]))
- by (instance, handler) > 0
- format: time_series
- hide: false
- intervalFactor: 2
- legendFormat: "{{ handler }} in {{ instance }}"
- refId: B
- thresholds: []
- timeFrom:
- timeShift:
- title: Request size by handler
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Allocated bytes: "#F9BA8F"
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max count collector: "#bf1b00"
- Max count harvester: "#bf1b00"
- Max to persist: "#3F6833"
- RSS: "#890F02"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 8
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: "/Max.*/"
- fill: 0
- linewidth: 2
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: sum(prometheus_engine_queries{instance="$instance"}) by (instance, handler)
- format: time_series
- intervalFactor: 2
- legendFormat: 'Current count '
- metric: last
- refId: A
- step: 1800
- - expr: sum(prometheus_engine_queries_concurrent_max{instance="$instance"}) by
- (instance, handler)
- format: time_series
- intervalFactor: 2
- legendFormat: Max count
- metric: last
- refId: B
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Cont of concurent queries
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Requests & queries
- titleSize: h6
- - collapse: false
- height: 250
- panels:
- - aliasColors:
- Alert queue capacity on o collector: "#bf1b00"
- Alert queue capacity on o harvester: "#bf1b00"
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 20
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: "/.*capacity.*/"
- fill: 0
- linewidth: 2
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: sum(prometheus_notifications_queue_capacity{instance="$instance"})by (instance)
- format: time_series
- intervalFactor: 2
- legendFormat: 'Alert queue capacity '
- metric: prometheus_local_storage_checkpoint_last_size_bytes
- refId: A
- step: 1800
- - expr: sum(prometheus_notifications_queue_length{instance="$instance"})by (instance)
- format: time_series
- intervalFactor: 2
- legendFormat: 'Alert queue size on '
- metric: prometheus_local_storage_checkpoint_last_size_bytes
- refId: B
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Alert queue size
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 21
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: sum(prometheus_notifications_alertmanagers_discovered{instance="$instance"})
- by (instance)
- format: time_series
- intervalFactor: 2
- legendFormat: Checkpoint chunks written/s
- metric: prometheus_local_storage_checkpoint_series_chunks_written_sum
- refId: A
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Count of discovered alertmanagers
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: none
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 39
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: sum(increase(prometheus_notifications_dropped_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: notifications_dropped on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: F
- step: 1800
- - expr: sum(increase(prometheus_rule_evaluation_failures_total{rule_type="alerting",instance="$instance"}[$aggregation_interval]))
- by (rule_type,instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: rule_evaluation_failures on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: A
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Alerting errors
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Alerting
- titleSize: h6
- - collapse: false
- height: 250
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 45
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: true
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: increase(prometheus_target_sync_length_seconds_count{scrape_job="kubernetes-service-endpoints"}[$aggregation_interval])
- format: time_series
- intervalFactor: 2
- legendFormat: Count of target synces
- refId: A
- step: 240
- thresholds: []
- timeFrom:
- timeShift:
- title: Kubernetes SD sync count
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 46
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: sum(increase(prometheus_target_scrapes_exceeded_sample_limit_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: exceeded_sample_limit on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: A
- step: 1800
- - expr: sum(increase(prometheus_sd_file_read_errors_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- interval: ''
- intervalFactor: 2
- legendFormat: sd_file_read_error on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: E
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Service discovery errors
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Service discovery
- titleSize: h6
- - collapse: false
- height: 250
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 36
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: sum(increase(prometheus_tsdb_reloads_total{instance="$instance"}[30m]))
- by (instance)
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ instance }}"
- refId: A
- thresholds: []
- timeFrom:
- timeShift:
- title: Reloaded block from disk
- tooltip:
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 5
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: sum(prometheus_tsdb_blocks_loaded{instance="$instance"}) by (instance)
- format: time_series
- intervalFactor: 2
- legendFormat: Loaded data blocks
- metric: prometheus_local_storage_memory_chunkdescs
- refId: A
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Loaded data blocks
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 3
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: prometheus_tsdb_head_series{instance="$instance"}
- format: time_series
- intervalFactor: 2
- legendFormat: Time series count
- metric: prometheus_local_storage_memory_series
- refId: A
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Time series total count
- tooltip:
- msResolution: false
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 1
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(prometheus_tsdb_head_samples_appended_total{instance="$instance"}[$aggregation_interval]))
- by (instance)
- format: time_series
- intervalFactor: 2
- legendFormat: samples/s {{instance}}
- metric: prometheus_local_storage_ingested_samples_total
- refId: A
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Samples Appended per second
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label: ''
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: TSDB stats
- titleSize: h6
- - collapse: false
- height: 250
- panels:
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- To persist: "#9AC48A"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 2
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: "/Max.*/"
- fill: 0
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: sum(prometheus_tsdb_head_chunks{instance="$instance"}) by (instance)
- format: time_series
- hide: false
- intervalFactor: 2
- legendFormat: Head chunk count
- metric: prometheus_local_storage_memory_chunks
- refId: A
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Head chunks count
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 35
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: max(prometheus_tsdb_head_max_time{instance="$instance"}) by (instance)
- - min(prometheus_tsdb_head_min_time{instance="$instance"}) by (instance)
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ instance }}"
- refId: A
- thresholds: []
- timeFrom:
- timeShift:
- title: Length of head block
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: ms
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 4
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(prometheus_tsdb_head_chunks_created_total{instance="$instance"}[$aggregation_interval]))
- by (instance)
- format: time_series
- intervalFactor: 2
- legendFormat: created on {{ instance }}
- refId: B
- - expr: sum(rate(prometheus_tsdb_head_chunks_removed_total{instance="$instance"}[$aggregation_interval]))
- by (instance) * -1
- format: time_series
- intervalFactor: 2
- legendFormat: deleted on {{ instance }}
- refId: C
- thresholds: []
- timeFrom:
- timeShift:
- title: Head Chunks Created/Deleted per second
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Head block stats
- titleSize: h6
- - collapse: false
- height: 250
- panels:
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 33
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: sum(increase(prometheus_tsdb_compaction_duration_sum{instance="$instance"}[30m])
- / increase(prometheus_tsdb_compaction_duration_count{instance="$instance"}[30m]))
- by (instance)
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ instance }}"
- refId: B
- thresholds: []
- timeFrom:
- timeShift:
- title: Compaction duration
- tooltip:
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: s
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 34
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: sum(prometheus_tsdb_head_gc_duration_seconds{instance="$instance"}) by
- (instance, quantile)
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ quantile }} on {{ instance }}"
- refId: A
- thresholds: []
- timeFrom:
- timeShift:
- title: Go Garbage collection duration
- tooltip:
- shared: true
- sort: 0
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: s
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 37
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: sum(prometheus_tsdb_wal_truncate_duration_seconds{instance="$instance"})
- by (instance, quantile)
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ quantile }} on {{ instance }}"
- refId: A
- thresholds: []
- timeFrom:
- timeShift:
- title: WAL truncate duration seconds
- tooltip:
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- fill: 1
- id: 38
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: connected
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 3
- stack: false
- steppedLine: false
- targets:
- - expr: sum(tsdb_wal_fsync_duration_seconds{instance="$instance"}) by (instance,
- quantile)
- format: time_series
- intervalFactor: 2
- legendFormat: "{{ quantile }} {{ instance }}"
- refId: A
- thresholds: []
- timeFrom:
- timeShift:
- title: WAL fsync duration seconds
- tooltip:
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: s
- label:
- logBase: 1
- max:
- min:
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Data maintenance
- titleSize: h6
- - collapse: false
- height: 250
- panels:
- - aliasColors:
- Allocated bytes: "#7EB26D"
- Allocated bytes - 1m max: "#BF1B00"
- Allocated bytes - 1m min: "#BF1B00"
- Allocated bytes - 5m max: "#BF1B00"
- Allocated bytes - 5m min: "#BF1B00"
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- RSS: "#447EBC"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- decimals:
- editable: true
- error: false
- fill: 1
- id: 6
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides:
- - alias: "/-/"
- fill: 0
- - alias: collector heap size
- color: "#E0752D"
- fill: 0
- linewidth: 2
- - alias: collector kubernetes memory limit
- color: "#BF1B00"
- fill: 0
- linewidth: 3
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: sum(process_resident_memory_bytes{instance="$instance"}) by (instance)
- format: time_series
- hide: false
- intervalFactor: 2
- legendFormat: Total resident memory - {{instance}}
- metric: process_resident_memory_bytes
- refId: B
- step: 1800
- - expr: sum(go_memstats_alloc_bytes{instance="$instance"}) by (instance)
- format: time_series
- hide: false
- intervalFactor: 2
- legendFormat: Total llocated bytes - {{instance}}
- metric: go_memstats_alloc_bytes
- refId: A
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Memory
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors:
- Allocated bytes: "#F9BA8F"
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- RSS: "#890F02"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 7
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: rate(go_memstats_alloc_bytes_total{instance="$instance"}[$aggregation_interval])
- format: time_series
- intervalFactor: 2
- legendFormat: Allocated Bytes/s
- metric: go_memstats_alloc_bytes
- refId: A
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Allocations per second
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: bytes
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- - aliasColors: {}
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- decimals: 2
- editable: true
- error: false
- fill: 1
- id: 9
- legend:
- alignAsTable: false
- avg: false
- current: false
- hideEmpty: false
- max: false
- min: false
- rightSide: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 4
- stack: false
- steppedLine: false
- targets:
- - expr: sum(rate(process_cpu_seconds_total{instance="$instance"}[$aggregation_interval]))
- by (instance)
- format: time_series
- intervalFactor: 2
- legendFormat: CPU/s
- metric: prometheus_local_storage_ingested_samples_total
- refId: B
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: CPU per second
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values:
- - avg
- yaxes:
- - format: none
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: RAM&CPU
- titleSize: h6
- - collapse: false
- height: 250
- panels:
- - aliasColors:
- Chunks: "#1F78C1"
- Chunks to persist: "#508642"
- Max chunks: "#052B51"
- Max to persist: "#3F6833"
- bars: false
- dashLength: 10
- dashes: false
- datasource: "${DS_PROMETHEUS}"
- editable: true
- error: false
- fill: 1
- id: 47
- legend:
- avg: false
- current: false
- max: false
- min: false
- show: false
- total: false
- values: false
- lines: true
- linewidth: 1
- links: []
- nullPointMode: 'null'
- percentage: false
- pointradius: 5
- points: false
- renderer: flot
- seriesOverrides: []
- spaceLength: 10
- span: 12
- stack: false
- steppedLine: false
- targets:
- - expr: sum(increase(net_conntrack_dialer_conn_failed_total{instance="$instance"}[$aggregation_interval]))
- by (instance) > 0
- format: time_series
- hide: false
- interval: ''
- intervalFactor: 2
- legendFormat: conntrack_dialer_conn_failed on {{ instance }}
- metric: prometheus_local_storage_chunk_ops_total
- refId: M
- step: 1800
- thresholds: []
- timeFrom:
- timeShift:
- title: Net errors
- tooltip:
- msResolution: false
- shared: true
- sort: 2
- value_type: individual
- type: graph
- xaxis:
- buckets:
- mode: time
- name:
- show: true
- values: []
- yaxes:
- - format: short
- label:
- logBase: 1
- max:
- min: '0'
- show: true
- - format: short
- label:
- logBase: 1
- max:
- min:
- show: true
- repeat:
- repeatIteration:
- repeatRowId:
- showTitle: true
- title: Contrac errors
- titleSize: h6
- schemaVersion: 14
- style: dark
- tags:
- - prometheus
- templating:
- list:
- - auto: true
- auto_count: 30
- auto_min: 2m
- current:
- text: auto
- value: "$__auto_interval"
- hide: 0
- label: aggregation intarval
- name: aggregation_interval
- options:
- - selected: true
- text: auto
- value: "$__auto_interval"
- - selected: false
- text: 1m
- value: 1m
- - selected: false
- text: 10m
- value: 10m
- - selected: false
- text: 30m
- value: 30m
- - selected: false
- text: 1h
- value: 1h
- - selected: false
- text: 6h
- value: 6h
- - selected: false
- text: 12h
- value: 12h
- - selected: false
- text: 1d
- value: 1d
- - selected: false
- text: 7d
- value: 7d
- - selected: false
- text: 14d
- value: 14d
- - selected: false
- text: 30d
- value: 30d
- query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d
- refresh: 2
- type: interval
- - allValue:
- current: {}
- datasource: "${DS_PROMETHEUS}"
- hide: 0
- includeAll: false
- label: Instance
- multi: false
- name: instance
- options: []
- query: label_values(prometheus_build_info, instance)
- refresh: 2
- regex: ''
- sort: 2
- tagValuesQuery: ''
- tags: []
- tagsQuery: ''
- type: query
- useTags: false
- - current:
- text: Prometheus
- value: Prometheus
- hide: 0
- label: Prometheus datasource
- name: DS_PROMETHEUS
- options: []
- query: prometheus
- refresh: 1
- regex: ''
- type: datasource
- - current:
- text: influxdb(heapster) - kokura
- value: influxdb(heapster) - kokura
- hide: 0
- label: InfluxDB datasource
- name: influx_datasource
- options: []
- query: influxdb
- refresh: 1
- regex: ''
- type: datasource
- time:
- from: now-7d
- to: now
- timepicker:
- refresh_intervals:
- - 5s
- - 10s
- - 30s
- - 1m
- - 5m
- - 15m
- - 30m
- - 1h
- - 2h
- - 1d
- time_options:
- - 5m
- - 15m
- - 1h
- - 6h
- - 12h
- - 24h
- - 2d
- - 7d
- - 30d
- timezone: browser
- title: Prometheus2.0 (v1.0.0 by FUSAKLA)
- version: 8
+ home_dashboard: |-
+ {
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 66,
+ "links": [],
+ "panels": [
+ {
+ "content": "
\n ATT Home Dashboard\n
\n\n AT&T Proprietary (Internal Use Only)\n
",
+ "editable": true,
+ "gridPos": {
+ "h": 3,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 1,
+ "links": [],
+ "mode": "html",
+ "options": {},
+ "style": {},
+ "title": "",
+ "transparent": true,
+ "type": "text"
+ },
+ {
+ "folderId": 0,
+ "gridPos": {
+ "h": 10,
+ "w": 13,
+ "x": 6,
+ "y": 3
+ },
+ "headings": true,
+ "id": 3,
+ "limit": 30,
+ "links": [],
+ "options": {},
+ "query": "",
+ "recent": true,
+ "search": false,
+ "starred": true,
+ "tags": [],
+ "title": "",
+ "type": "dashlist"
+ }
+ ],
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": []
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "hidden": true,
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ],
+ "type": "timepicker"
+ },
+ "timezone": "browser",
+ "title": "OSH Home",
+ "version": 1
+ }
+ ceph_cluster: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": ""
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "Ceph Cluster overview.\r\n",
+ "editable": false,
+ "overwrite": true,
+ "gnetId": 917,
+ "graphTooltip": 0,
+ "id": 134,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 35,
+ "panels": [],
+ "title": "New row",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 4,
+ "x": 0,
+ "y": 1
+ },
+ "id": 21,
+ "interval": "1m",
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "avg(ceph_health_status{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Status",
+ "type": "singlestat",
+ "valueFontSize": "100%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "HEALTHY",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "WARNING",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "CRITICAL",
+ "value": "2"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 4,
+ "x": 4,
+ "y": 1
+ },
+ "id": 22,
+ "interval": "1m",
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "count(ceph_pool_max_avail{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "",
+ "title": "Pools",
+ "type": "singlestat",
+ "valueFontSize": "100%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "bytes",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 4,
+ "x": 8,
+ "y": 1
+ },
+ "id": 33,
+ "interval": "1m",
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "avg(ceph_cluster_total_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "0.025,0.1",
+ "title": "Cluster Capacity",
+ "type": "singlestat",
+ "valueFontSize": "100%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "bytes",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 4,
+ "x": 12,
+ "y": 1
+ },
+ "id": 34,
+ "interval": "1m",
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "avg(ceph_cluster_total_used_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "0.025,0.1",
+ "title": "Used Capacity",
+ "type": "singlestat",
+ "valueFontSize": "100%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "percentunit",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 4,
+ "x": 16,
+ "y": 1
+ },
+ "id": 23,
+ "interval": "1m",
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "avg(ceph_cluster_total_used_bytes/ceph_cluster_total_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "70,80",
+ "title": "Current Utilization",
+ "type": "singlestat",
+ "valueFontSize": "100%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {
+ "Available": "#EAB839",
+ "Total Capacity": "#447EBC",
+ "Used": "#BF1B00",
+ "total_avail": "#6ED0E0",
+ "total_space": "#7EB26D",
+ "total_used": "#890F02"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 5,
+ "grid": {},
+ "gridPos": {
+ "h": 8,
+ "w": 8,
+ "x": 0,
+ "y": 5
+ },
+ "height": "300",
+ "id": 39,
+ "interval": "",
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 5,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "ceph_health_status{application=\"ceph\",component=\"manager\",instance=\"172.29.0.26:9283\",job=\"ceph-mgr\",namespace=\"ceph\",release_group=\"clcp-ucp-ceph-client\"}",
+ "fill": 0,
+ "linewidth": 3,
+ "stack": false
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "ceph_health_status{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "ceph-health",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Cluster Status (0-Healthy, 1-Warning, 2-Critical)",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "columns": [
+ {
+ "text": "Current",
+ "value": "current"
+ }
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "fontSize": "100%",
+ "gridPos": {
+ "h": 8,
+ "w": 8,
+ "x": 8,
+ "y": 5
+ },
+ "id": 40,
+ "links": [],
+ "options": {},
+ "pageSize": null,
+ "scroll": true,
+ "showHeader": true,
+ "sort": {
+ "col": 0,
+ "desc": true
+ },
+ "styles": [
+ {
+ "alias": "Time",
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "pattern": "Time",
+ "type": "date"
+ },
+ {
+ "alias": "",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "decimals": 2,
+ "pattern": "/.*/",
+ "thresholds": [],
+ "type": "number",
+ "unit": "short"
+ }
+ ],
+ "targets": [
+ {
+ "expr": "ceph_mgr_status{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "{{job}} {{ceph_daemon}}",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "timeFrom": null,
+ "timeShift": null,
+ "title": "Cluster Manager",
+ "transform": "timeseries_aggregations",
+ "type": "table"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 13
+ },
+ "id": 36,
+ "panels": [],
+ "title": "New row",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 2,
+ "x": 0,
+ "y": 14
+ },
+ "id": 26,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(ceph_osd_in{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "",
+ "title": "OSDs IN",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 40, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 2,
+ "x": 2,
+ "y": 14
+ },
+ "id": 27,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(ceph_osd_metadata{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}) - sum(ceph_osd_in{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "OSDs OUT",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 2,
+ "x": 4,
+ "y": 14
+ },
+ "id": 28,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(ceph_osd_up{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "",
+ "title": "OSDs UP",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 40, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 2,
+ "x": 6,
+ "y": 14
+ },
+ "id": 29,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(ceph_osd_metadata{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}) - sum(ceph_osd_up{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "OSDs DOWN",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 8,
+ "y": 14
+ },
+ "id": 30,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "avg(ceph_osd_numpg{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "250,300",
+ "title": "Average PGs per OSD",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 17
+ },
+ "id": 37,
+ "panels": [],
+ "repeat": null,
+ "title": "CLUSTER",
+ "type": "row"
+ },
+ {
+ "aliasColors": {
+ "Available": "#EAB839",
+ "Total Capacity": "#447EBC",
+ "Used": "#BF1B00",
+ "total_avail": "#6ED0E0",
+ "total_space": "#7EB26D",
+ "total_used": "#890F02"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 4,
+ "grid": {},
+ "gridPos": {
+ "h": 8,
+ "w": 8,
+ "x": 0,
+ "y": 18
+ },
+ "height": "300",
+ "id": 1,
+ "interval": "$interval",
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 0,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "Total Capacity",
+ "fill": 0,
+ "linewidth": 3,
+ "stack": false
+ }
+ ],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "ceph_cluster_total_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"} - ceph_cluster_total_used_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Available",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "ceph_cluster_total_used_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Used",
+ "refId": "B",
+ "step": 60
+ },
+ {
+ "expr": "ceph_cluster_total_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Total Capacity",
+ "refId": "C",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Capacity",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Total Capacity": "#7EB26D",
+ "Used": "#BF1B00",
+ "total_avail": "#6ED0E0",
+ "total_space": "#7EB26D",
+ "total_used": "#890F02"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 8,
+ "w": 8,
+ "x": 8,
+ "y": 18
+ },
+ "height": "300",
+ "id": 3,
+ "interval": "$interval",
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(ceph_osd_op_w{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Write",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "sum(ceph_osd_op_r{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Read",
+ "refId": "B",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "IOPS",
+ "tooltip": {
+ "msResolution": true,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 8,
+ "w": 8,
+ "x": 16,
+ "y": 18
+ },
+ "height": "300",
+ "id": 7,
+ "interval": "$interval",
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(ceph_osd_op_in_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Write",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "sum(ceph_osd_op_out_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Read",
+ "refId": "B",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Throughput",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 26
+ },
+ "id": 38,
+ "panels": [],
+ "title": "New row",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 24,
+ "x": 0,
+ "y": 27
+ },
+ "id": 18,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "/^Total.*$/",
+ "stack": false
+ }
+ ],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(ceph_pool_objects{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Total",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Objects in the Cluster",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 1,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 34
+ },
+ "id": 19,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "/^Total.*$/",
+ "stack": false
+ }
+ ],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(ceph_osd_numpg{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Total",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "sum(ceph_pg_active{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Active",
+ "refId": "B",
+ "step": 60
+ },
+ {
+ "expr": "sum(ceph_pg_inconsistent{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Inconsistent",
+ "refId": "C",
+ "step": 60
+ },
+ {
+ "expr": "sum(ceph_pg_creating{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Creating",
+ "refId": "D",
+ "step": 60
+ },
+ {
+ "expr": "sum(ceph_pg_recovering{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Recovering",
+ "refId": "E",
+ "step": 60
+ },
+ {
+ "expr": "sum(ceph_pg_down{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Down",
+ "refId": "F",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "PGs",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 1,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 34
+ },
+ "id": 20,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "/^Total.*$/",
+ "stack": false
+ }
+ ],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(ceph_pg_degraded{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Degraded",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "sum(ceph_pg_stale{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Stale",
+ "refId": "B",
+ "step": 60
+ },
+ {
+ "expr": "sum(ceph_pg_undersized{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Undersized",
+ "refId": "C",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Stuck PGs",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 1,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "5m",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [
+ "ceph",
+ "cluster"
+ ],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "label_values(ceph_health_status{nc_region=\"$region\"}, release_group)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Cluster",
+ "multi": false,
+ "name": "ceph_cluster",
+ "options": [],
+ "query": "label_values(ceph_health_status{nc_region=\"$region\"}, release_group)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 2,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "auto": true,
+ "auto_count": 10,
+ "auto_min": "1m",
+ "current": {
+ "text": "1m",
+ "value": "1m"
+ },
+ "datasource": null,
+ "hide": 0,
+ "includeAll": false,
+ "label": "Interval",
+ "multi": false,
+ "name": "interval",
+ "options": [
+ {
+ "selected": false,
+ "text": "auto",
+ "value": "$__auto_interval_interval"
+ },
+ {
+ "selected": true,
+ "text": "1m",
+ "value": "1m"
+ },
+ {
+ "selected": false,
+ "text": "10m",
+ "value": "10m"
+ },
+ {
+ "selected": false,
+ "text": "30m",
+ "value": "30m"
+ },
+ {
+ "selected": false,
+ "text": "1h",
+ "value": "1h"
+ },
+ {
+ "selected": false,
+ "text": "6h",
+ "value": "6h"
+ },
+ {
+ "selected": false,
+ "text": "12h",
+ "value": "12h"
+ },
+ {
+ "selected": false,
+ "text": "1d",
+ "value": "1d"
+ },
+ {
+ "selected": false,
+ "text": "7d",
+ "value": "7d"
+ },
+ {
+ "selected": false,
+ "text": "14d",
+ "value": "14d"
+ },
+ {
+ "selected": false,
+ "text": "30d",
+ "value": "30d"
+ }
+ ],
+ "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d",
+ "refresh": 2,
+ "skipUrlSync": false,
+ "type": "interval"
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Ceph - Cluster",
+ "uid": "ceph-cluster",
+ "version": 2
+ }
+ ceph_osd: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "Prometheus.IO",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": ""
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "CEPH OSD Status.",
+ "editable": false,
+ "overwrite": true,
+ "gnetId": 923,
+ "graphTooltip": 0,
+ "id": 140,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 11,
+ "panels": [],
+ "title": "New row",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 40, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 2,
+ "x": 0,
+ "y": 1
+ },
+ "id": 6,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 2,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ },
+ {
+ "from": "0",
+ "text": "DOWN",
+ "to": "0.99"
+ },
+ {
+ "from": "0.99",
+ "text": "UP",
+ "to": "1"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "ceph_osd_up{ceph_daemon=\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "0,1",
+ "timeFrom": null,
+ "title": "Status",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "DOWN",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "UP",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 40, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 2,
+ "x": 2,
+ "y": 1
+ },
+ "id": 8,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 2,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ },
+ {
+ "from": "0",
+ "text": "OUT",
+ "to": "0.99"
+ },
+ {
+ "from": "0.99",
+ "text": "IN",
+ "to": "1"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "ceph_osd_in{ceph_daemon=\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "0,1",
+ "timeFrom": null,
+ "title": "Available",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "OUT",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "IN",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 2,
+ "x": 4,
+ "y": 1
+ },
+ "id": 10,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 2,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "count(ceph_osd_metadata{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "0,1",
+ "timeFrom": null,
+ "title": "Total OSDs",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "DOWN",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "UP",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 4
+ },
+ "id": 12,
+ "panels": [],
+ "title": "OSD: $osd",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 20,
+ "x": 0,
+ "y": 5
+ },
+ "id": 5,
+ "interval": "$interval",
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "/^Average.*/",
+ "fill": 0,
+ "stack": false
+ }
+ ],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "ceph_osd_numpg{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Number of PGs - {{ $osd }}",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "avg(ceph_osd_numpg{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Average Number of PGs in the Cluster",
+ "refId": "B",
+ "step": 60
+ }
+ ],
+ "thresholds": [
+ {
+ "colorMode": "custom",
+ "line": true,
+ "lineColor": "rgba(216, 200, 27, 0.27)",
+ "op": "gt",
+ "value": 250
+ },
+ {
+ "colorMode": "custom",
+ "line": true,
+ "lineColor": "rgba(234, 112, 112, 0.22)",
+ "op": "gt",
+ "value": 300
+ }
+ ],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "PGs",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "percent",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 20,
+ "y": 5
+ },
+ "id": 7,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "(ceph_osd_stat_bytes_used{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}/ceph_osd_stat_bytes{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})*100",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "60,80",
+ "timeFrom": null,
+ "title": "Utilization",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 12
+ },
+ "id": 13,
+ "panels": [],
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 13
+ },
+ "id": 2,
+ "interval": "$interval",
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "ceph_osd_stat_bytes_used{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Used - {{ $osd }}",
+ "metric": "ceph_osd_used_bytes",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "ceph_osd_stat_bytes{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"} - ceph_osd_stat_bytes_used{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "hide": false,
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Available - {{ $osd }}",
+ "metric": "ceph_osd_avail_bytes",
+ "refId": "B",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "OSD Storage",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 5,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 13
+ },
+ "id": 9,
+ "interval": "$interval",
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": false,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": true,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "(ceph_osd_stat_bytes_used{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}/ceph_osd_stat_bytes{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "Utilization - {{ $osd }}",
+ "metric": "ceph_osd_avail_bytes",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Utilization Variance",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "none",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": false,
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [
+ "ceph",
+ "osd"
+ ],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "label_values(ceph_health_status{nc_region=\"$region\"}, release_group)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Cluster",
+ "multi": false,
+ "name": "ceph_cluster",
+ "options": [],
+ "query": "label_values(ceph_health_status{nc_region=\"$region\"}, release_group)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 2,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "auto": true,
+ "auto_count": 10,
+ "auto_min": "1m",
+ "current": {
+ "text": "1m",
+ "value": "1m"
+ },
+ "datasource": null,
+ "hide": 0,
+ "includeAll": false,
+ "label": "Interval",
+ "multi": false,
+ "name": "interval",
+ "options": [
+ {
+ "selected": false,
+ "text": "auto",
+ "value": "$__auto_interval_interval"
+ },
+ {
+ "selected": true,
+ "text": "1m",
+ "value": "1m"
+ },
+ {
+ "selected": false,
+ "text": "10m",
+ "value": "10m"
+ },
+ {
+ "selected": false,
+ "text": "30m",
+ "value": "30m"
+ },
+ {
+ "selected": false,
+ "text": "1h",
+ "value": "1h"
+ },
+ {
+ "selected": false,
+ "text": "6h",
+ "value": "6h"
+ },
+ {
+ "selected": false,
+ "text": "12h",
+ "value": "12h"
+ },
+ {
+ "selected": false,
+ "text": "1d",
+ "value": "1d"
+ },
+ {
+ "selected": false,
+ "text": "7d",
+ "value": "7d"
+ },
+ {
+ "selected": false,
+ "text": "14d",
+ "value": "14d"
+ },
+ {
+ "selected": false,
+ "text": "30d",
+ "value": "30d"
+ }
+ ],
+ "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d",
+ "refresh": 2,
+ "skipUrlSync": false,
+ "type": "interval"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": false,
+ "label": "OSD",
+ "multi": false,
+ "name": "osd",
+ "options": [],
+ "query": "label_values(ceph_osd_metadata{release_group=\"$ceph_cluster\"}, ceph_daemon)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-30m",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Ceph - OSD",
+ "uid": "ceph-osd",
+ "version": 2
+ }
+ ceph_pool: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "Prometheus.IO",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": ""
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "Ceph Pools dashboard.",
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 143,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 11,
+ "panels": [],
+ "title": "Pool: $pool",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 4,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 20,
+ "x": 0,
+ "y": 1
+ },
+ "height": "",
+ "id": 2,
+ "interval": "$interval",
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 0,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "/^Total.*$/",
+ "fill": 0,
+ "linewidth": 4,
+ "stack": false
+ },
+ {
+ "alias": "/^Raw.*$/",
+ "color": "#BF1B00",
+ "fill": 0,
+ "linewidth": 4
+ }
+ ],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "ceph_pool_max_avail{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Total - {{ $pool }}",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "ceph_pool_stored{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Used - {{ $pool }}",
+ "refId": "B",
+ "step": 60
+ },
+ {
+ "expr": "ceph_pool_max_avail{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"} - ceph_pool_stored{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Available - {{ $pool }}",
+ "refId": "C",
+ "step": 60
+ },
+ {
+ "expr": "ceph_pool_raw_bytes_used{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Raw - {{ $pool }}",
+ "refId": "D",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "[[pool_name]] Pool Storage",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "format": "percentunit",
+ "gauge": {
+ "maxValue": 1,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 20,
+ "y": 1
+ },
+ "id": 10,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "(ceph_pool_stored{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"} / ceph_pool_max_avail{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": "",
+ "title": "[[pool_name]] Pool Usage",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 8
+ },
+ "id": 12,
+ "panels": [],
+ "title": "Pool Objects and I/O",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 9
+ },
+ "height": "",
+ "id": 7,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "ceph_pool_objects{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Objects - {{ $pool_name }}",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "ceph_pool_dirty{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Dirty Objects - {{ $pool_name }}",
+ "refId": "B",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Objects in Pool [[pool_name]]",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 9
+ },
+ "id": 4,
+ "interval": "$interval",
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "irate(ceph_pool_rd{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}[3m])",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Read - {{ $pool_name }}",
+ "refId": "B",
+ "step": 60
+ },
+ {
+ "expr": "irate(ceph_pool_wr{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}[3m])",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Write - {{ $pool_name }}",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "[[pool_name]] Pool IOPS",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "IOPS",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": "IOPS",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 24,
+ "x": 0,
+ "y": 16
+ },
+ "id": 5,
+ "interval": "$interval",
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "irate(ceph_pool_rd_bytes{pool_id=\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}[3m])",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Read Bytes - {{ $pool_name }}",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "irate(ceph_pool_wr_bytes{pool_id=\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}[3m])",
+ "format": "time_series",
+ "interval": "$interval",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Written Bytes - {{ $pool_name }}",
+ "refId": "B",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "[[pool_name]] Pool Throughput",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "5m",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [
+ "ceph",
+ "pools"
+ ],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "label_values(ceph_health_status{nc_region=\"$region\"}, release_group)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Cluster",
+ "multi": false,
+ "name": "ceph_cluster",
+ "options": [],
+ "query": "label_values(ceph_health_status{nc_region=\"$region\"}, release_group)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 2,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "auto": true,
+ "auto_count": 10,
+ "auto_min": "1m",
+ "current": {
+ "text": "1m",
+ "value": "1m"
+ },
+ "datasource": null,
+ "hide": 0,
+ "includeAll": false,
+ "label": "Interval",
+ "multi": false,
+ "name": "interval",
+ "options": [
+ {
+ "selected": false,
+ "text": "auto",
+ "value": "$__auto_interval_interval"
+ },
+ {
+ "selected": true,
+ "text": "1m",
+ "value": "1m"
+ },
+ {
+ "selected": false,
+ "text": "10m",
+ "value": "10m"
+ },
+ {
+ "selected": false,
+ "text": "30m",
+ "value": "30m"
+ },
+ {
+ "selected": false,
+ "text": "1h",
+ "value": "1h"
+ },
+ {
+ "selected": false,
+ "text": "6h",
+ "value": "6h"
+ },
+ {
+ "selected": false,
+ "text": "12h",
+ "value": "12h"
+ },
+ {
+ "selected": false,
+ "text": "1d",
+ "value": "1d"
+ },
+ {
+ "selected": false,
+ "text": "7d",
+ "value": "7d"
+ },
+ {
+ "selected": false,
+ "text": "14d",
+ "value": "14d"
+ },
+ {
+ "selected": false,
+ "text": "30d",
+ "value": "30d"
+ }
+ ],
+ "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d",
+ "refresh": 2,
+ "skipUrlSync": false,
+ "type": "interval"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(ceph_pool_objects{release_group=\"$ceph_cluster\", nc_region=\"$region\"}, pool_id)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Pool ID",
+ "multi": false,
+ "name": "pool",
+ "options": [],
+ "query": "label_values(ceph_pool_objects{release_group=\"$ceph_cluster\", nc_region=\"$region\"}, pool_id)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Pool Name",
+ "multi": false,
+ "name": "pool_name",
+ "options": [],
+ "query": "label_values(ceph_pool_metadata{release_group=\"$ceph_cluster\",pool_id=\"[[pool]]\" }, name)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Ceph - Pools",
+ "uid": "ceph-pools",
+ "version": 5
+ }
+ armada_dashboard: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 104,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 9,
+ "panels": [],
+ "title": "Deployment Health",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 9,
+ "w": 12,
+ "x": 0,
+ "y": 1
+ },
+ "id": 23,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "armada_apply_failure_total{manifest=~\"$manifest\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "Armada Apply",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Armada Apply Failures",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 9,
+ "w": 12,
+ "x": 12,
+ "y": 1
+ },
+ "id": 28,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "armada_chart_deploy_attempt_total{manifest=~\"$manifest\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{chart}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Helm Chart Attempts",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 9,
+ "w": 12,
+ "x": 0,
+ "y": 10
+ },
+ "id": 7,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(armada_chart_handle_failure_total{manifest=~\"$manifest\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "hide": false,
+ "instant": false,
+ "intervalFactor": 1,
+ "legendFormat": "Chart Failures",
+ "refId": "A"
+ },
+ {
+ "expr": "sum(armada_chart_test_failure_total{manifest=~\"$manifest\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 1,
+ "legendFormat": "Chart Test Failures",
+ "refId": "C"
+ },
+ {
+ "expr": "sum(armada_chart_deploy_failure_total{manifest=~\"$manifest\",nc_region=~\"$region\"}) ",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 1,
+ "legendFormat": "Chart Deploy Failures",
+ "refId": "D"
+ },
+ {
+ "expr": "sum(armada_chart_deploy_failure_total{manifest=~\"$manifest\",action=\"install\",nc_region=~\"$region\"}) ",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 1,
+ "legendFormat": "Chart Deploy Install Failures",
+ "refId": "B"
+ },
+ {
+ "expr": "sum(armada_chart_deploy_failure_total{manifest=~\"$manifest\",action=\"upgrade\",nc_region=~\"$region\"}) ",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 1,
+ "legendFormat": "Chart Deploy Upgrade Failures",
+ "refId": "E"
+ },
+ {
+ "expr": "sum(armada_chart_deploy_failure_total{manifest=~\"$manifest\",action=\"noop\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 1,
+ "legendFormat": "Chart Deploy noop Failures",
+ "refId": "F"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Site Failures",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": "4",
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "columns": [],
+ "datasource": "${DS_PROMETHEUS}",
+ "fontSize": "100%",
+ "gridPos": {
+ "h": 9,
+ "w": 12,
+ "x": 12,
+ "y": 10
+ },
+ "id": 27,
+ "links": [],
+ "options": {},
+ "pageSize": null,
+ "scroll": true,
+ "showHeader": true,
+ "sort": {
+ "col": 0,
+ "desc": true
+ },
+ "styles": [
+ {
+ "alias": "Time",
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "pattern": "Time",
+ "type": "date"
+ },
+ {
+ "alias": "",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "decimals": 2,
+ "pattern": "chart",
+ "thresholds": [],
+ "type": "string",
+ "unit": "short"
+ },
+ {
+ "alias": "",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 2,
+ "pattern": "manifest",
+ "thresholds": [],
+ "type": "string",
+ "unit": "short"
+ },
+ {
+ "alias": "",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 2,
+ "pattern": "Value",
+ "thresholds": [],
+ "type": "number",
+ "unit": "short"
+ },
+ {
+ "alias": "",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 2,
+ "pattern": "/.*/",
+ "thresholds": [],
+ "type": "hidden",
+ "unit": "short"
+ }
+ ],
+ "targets": [
+ {
+ "expr": "armada_chart_handle_failure_total{nc_region=~\"$region\"}>0",
+ "format": "table",
+ "instant": true,
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A"
+ }
+ ],
+ "title": "Failed Charts",
+ "transform": "table",
+ "type": "table"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 19
+ },
+ "id": 19,
+ "panels": [],
+ "title": "Deployment Progress",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": true,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 9,
+ "w": 12,
+ "x": 0,
+ "y": 20
+ },
+ "id": 15,
+ "legend": {
+ "alignAsTable": false,
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": true,
+ "sideWidth": null,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "armada_chart_handle_attempt_inprogress{manifest=~\"$manifest\",nc_region=~\"$region\"}>0",
+ "format": "time_series",
+ "instant": false,
+ "intervalFactor": 1,
+ "legendFormat": "{{chart}}",
+ "refId": "A"
+ },
+ {
+ "expr": "count(armada_chart_handle_attempt_inprogress{manifest=~\"$manifest\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "hide": true,
+ "intervalFactor": 1,
+ "legendFormat": "Total chart attempts",
+ "refId": "B"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Deployment Progress",
+ "tooltip": {
+ "shared": false,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": "1",
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "columns": [],
+ "datasource": "${DS_PROMETHEUS}",
+ "fontSize": "100%",
+ "gridPos": {
+ "h": 9,
+ "w": 12,
+ "x": 12,
+ "y": 20
+ },
+ "id": 21,
+ "links": [],
+ "options": {},
+ "pageSize": null,
+ "scroll": true,
+ "showHeader": true,
+ "sort": {
+ "col": 0,
+ "desc": true
+ },
+ "styles": [
+ {
+ "alias": "Time",
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "pattern": "Time",
+ "type": "hidden"
+ },
+ {
+ "alias": "Chart",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 2,
+ "link": false,
+ "pattern": "Metric",
+ "thresholds": [],
+ "type": "string",
+ "unit": "short"
+ },
+ {
+ "alias": "",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 2,
+ "pattern": "Value",
+ "thresholds": [],
+ "type": "hidden",
+ "unit": "short"
+ },
+ {
+ "alias": "",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "decimals": 2,
+ "pattern": "/.*/",
+ "thresholds": [],
+ "type": "number",
+ "unit": "short"
+ }
+ ],
+ "targets": [
+ {
+ "expr": "armada_chart_deploy_attempt_inprogress{manifest=~\"$manifest\",nc_region=~\"$region\"}>0",
+ "format": "time_series",
+ "instant": true,
+ "intervalFactor": 1,
+ "legendFormat": "{{chart}}",
+ "refId": "A"
+ }
+ ],
+ "title": "Current Running Charts",
+ "transform": "timeseries_to_rows",
+ "type": "table"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 29
+ },
+ "id": 11,
+ "panels": [],
+ "title": "Timeout usage",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": true,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 9,
+ "w": 12,
+ "x": 0,
+ "y": 30
+ },
+ "id": 2,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": false,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sideWidth": 300,
+ "sort": "avg",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": false,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "(armada_chart_deploy_timeout_usage_ratio_sum{manifest=~\"$manifest\",action=~\"$action\",nc_region=~\"$region\"})*100>10",
+ "format": "time_series",
+ "instant": true,
+ "intervalFactor": 1,
+ "legendFormat": "{{chart}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [
+ {
+ "colorMode": "ok",
+ "fill": true,
+ "line": true,
+ "op": "gt",
+ "value": 0
+ },
+ {
+ "colorMode": "warning",
+ "fill": true,
+ "line": true,
+ "op": "gt",
+ "value": 50
+ },
+ {
+ "colorMode": "critical",
+ "fill": true,
+ "line": true,
+ "op": "gt",
+ "value": 80
+ }
+ ],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Percentage Chart Timeout Usage > 10%",
+ "tooltip": {
+ "shared": false,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "series",
+ "name": null,
+ "show": false,
+ "values": [
+ "avg"
+ ]
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "Percentage of timeout used",
+ "logBase": 1,
+ "max": "100",
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": true,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 9,
+ "w": 12,
+ "x": 12,
+ "y": 30
+ },
+ "id": 5,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": false,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sideWidth": 300,
+ "sort": "avg",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": false,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "(armada_chart_deploy_timeout_usage_ratio_sum{manifest=~\"$manifest\",action=~\"$action\",nc_region=~\"$region\"})*100<10",
+ "format": "time_series",
+ "instant": true,
+ "intervalFactor": 1,
+ "legendFormat": "{{chart}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [
+ {
+ "colorMode": "ok",
+ "fill": true,
+ "line": true,
+ "op": "lt",
+ "value": 10
+ },
+ {
+ "colorMode": "warning",
+ "fill": true,
+ "line": true,
+ "op": "lt",
+ "value": 5
+ },
+ {
+ "colorMode": "critical",
+ "fill": true,
+ "line": true,
+ "op": "lt",
+ "value": 1
+ }
+ ],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Percentage Chart Timeout Usage < 10%",
+ "tooltip": {
+ "shared": false,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "series",
+ "name": null,
+ "show": false,
+ "values": [
+ "avg"
+ ]
+ },
+ "yaxes": [
+ {
+ "decimals": null,
+ "format": "short",
+ "label": "Percentage of timeout used",
+ "logBase": 1,
+ "max": "10",
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": true,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 9,
+ "w": 12,
+ "x": 0,
+ "y": 39
+ },
+ "id": 25,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": false,
+ "max": true,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sideWidth": 300,
+ "sortDesc": false,
+ "total": false,
+ "values": true
+ },
+ "lines": false,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "armada_chart_handle_concurrency_count_sum{manifest=~\"$manifest\",nc_region=~\"$region\"}/armada_chart_handle_concurrency_count_count{manifest=~\"$manifest\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{chart}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Max Concurrency by Chart",
+ "tooltip": {
+ "shared": false,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "series",
+ "name": null,
+ "show": false,
+ "values": [
+ "max"
+ ]
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "Concurrency",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": false,
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {
+ "selected": false,
+ "tags": [],
+ "text": "full-site",
+ "value": [
+ "full-site"
+ ]
+ },
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Manifest",
+ "multi": true,
+ "name": "manifest",
+ "options": [
+ {
+ "selected": true,
+ "text": "full-site",
+ "value": "full-site"
+ }
+ ],
+ "query": "armada_apply_attempt_total",
+ "refresh": 0,
+ "regex": "/.*manifest=\"(.*?)\".*/",
+ "skipUrlSync": false,
+ "sort": 1,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {
+ "tags": [],
+ "text": "install + upgrade",
+ "value": [
+ "install",
+ "upgrade"
+ ]
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Armada Action",
+ "multi": true,
+ "name": "action",
+ "options": [
+ {
+ "selected": true,
+ "text": "install",
+ "value": "install"
+ },
+ {
+ "selected": false,
+ "text": "upgrade",
+ "value": "upgrade"
+ },
+ {
+ "selected": false,
+ "text": "noop",
+ "value": "noop"
+ }
+ ],
+ "query": "install,upgrade,noop",
+ "skipUrlSync": false,
+ "type": "custom"
+ }
+ ]
+ },
+ "time": {
+ "from": "now-6h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "browser",
+ "title": "Armada Dashboard",
+ "uid": "armada-dashboard",
+ "version": 1
+ }
+ containers: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.3.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": ""
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "Monitors Kubernetes cluster using Prometheus. Shows overall cluster CPU / Memory / Filesystem usage as well as individual pod, container, and systemd service statistics. Uses cAdvisor metrics only.",
+ "editable": false,
+ "overwrite": true,
+ "gnetId": 315,
+ "graphTooltip": 0,
+ "id": 209,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 33,
+ "panels": [],
+ "title": "Network I/O pressure",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 5,
+ "w": 24,
+ "x": 0,
+ "y": 1
+ },
+ "height": "200px",
+ "id": 32,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": false,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": false,
+ "sideWidth": 200,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum (rate (container_network_receive_bytes_total{kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[10m]))",
+ "format": "time_series",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "Received",
+ "metric": "network",
+ "refId": "A",
+ "step": 10
+ },
+ {
+ "expr": "- sum (rate (container_network_transmit_bytes_total{kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[10m]))",
+ "format": "time_series",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "Sent",
+ "metric": "network",
+ "refId": "B",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Network I/O pressure",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 6
+ },
+ "id": 34,
+ "panels": [],
+ "title": "Total usage",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "percent",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 8,
+ "x": 0,
+ "y": 7
+ },
+ "height": "180px",
+ "id": 4,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum (container_memory_working_set_bytes{id=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) / sum (machine_memory_bytes{kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) * 100",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": "65, 90",
+ "title": "Cluster memory usage",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "format": "percent",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 8,
+ "x": 8,
+ "y": 7
+ },
+ "height": "180px",
+ "id": 6,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum (rate (container_cpu_usage_seconds_total{id=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) / sum (machine_cpu_cores{kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) * 100",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": "65, 90",
+ "title": "Cluster CPU usage (5m avg)",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "format": "percent",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 8,
+ "x": 16,
+ "y": 7
+ },
+ "height": "180px",
+ "id": 7,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "max(sum (container_fs_usage_bytes{device=~\"^/dev/[sv]da[0-9]$\",nc_region=~\"$region\"}) by (kubernetes_io_hostname) / sum (container_fs_limit_bytes{device=~\"^/dev/[sv]da[0-9]$\",nc_region=~\"$region\"}) by (kubernetes_io_hostname) * 100)",
+ "format": "time_series",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "metric": "",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": "65, 90",
+ "title": "Cluster filesystem usage",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "format": "bytes",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 0,
+ "y": 12
+ },
+ "height": "1px",
+ "id": 9,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "20%",
+ "prefix": "",
+ "prefixFontSize": "20%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum (container_memory_working_set_bytes{id=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"})",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": "",
+ "title": "Used",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "format": "bytes",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 4,
+ "y": 12
+ },
+ "height": "1px",
+ "id": 10,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum (machine_memory_bytes{kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"})",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": "",
+ "title": "Total",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 8,
+ "y": 12
+ },
+ "height": "1px",
+ "id": 11,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": " cores",
+ "postfixFontSize": "30%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum (rate (container_cpu_usage_seconds_total{id=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m]))",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": "",
+ "title": "Used",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 12,
+ "y": 12
+ },
+ "height": "1px",
+ "id": 12,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": " cores",
+ "postfixFontSize": "30%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum (machine_cpu_cores{kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"})",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": "",
+ "title": "Total",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "format": "bytes",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 16,
+ "y": 12
+ },
+ "height": "1px",
+ "id": 13,
+ "interval": "",
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum (container_fs_usage_bytes{device=~\"^/dev/[sv]da[0-9]$\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": "",
+ "title": "Used",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "$DS_PROMETHEUS",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "format": "bytes",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 20,
+ "y": 12
+ },
+ "height": "1px",
+ "id": 14,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(container_fs_limit_bytes{device=~\"^/dev/[sv]da[0-9]$\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": "",
+ "title": "Total",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 15
+ },
+ "id": 35,
+ "panels": [],
+ "title": "Pods CPU usage",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 3,
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 24,
+ "x": 0,
+ "y": 16
+ },
+ "height": "",
+ "id": 17,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "sum (rate (container_cpu_usage_seconds_total{image!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (pod)",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "{{ pod }}",
+ "metric": "container_cpu",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Pods CPU usage (5m avg)",
+ "tooltip": {
+ "msResolution": true,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "cores",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 23
+ },
+ "id": 36,
+ "panels": [],
+ "title": "Containers CPU usage",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 3,
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 24,
+ "x": 0,
+ "y": 24
+ },
+ "height": "",
+ "id": 24,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sideWidth": null,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "sum (rate (container_cpu_usage_seconds_total{image!=\"\",name=~\"^k8s_.*\",container!=\"POD\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (container, pod)",
+ "hide": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "pod: {{ pod }} | {{ container }}",
+ "metric": "container_cpu",
+ "refId": "A",
+ "step": 10
+ },
+ {
+ "expr": "sum (rate (container_cpu_usage_seconds_total{image!=\"\",name!~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (kubernetes_io_hostname, name, image)",
+ "hide": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})",
+ "metric": "container_cpu",
+ "refId": "B",
+ "step": 10
+ },
+ {
+ "expr": "sum (rate (container_cpu_usage_seconds_total{rkt_container_name!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (kubernetes_io_hostname, rkt_container_name)",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}",
+ "metric": "container_cpu",
+ "refId": "C",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Containers CPU usage (5m avg)",
+ "tooltip": {
+ "msResolution": true,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "cores",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 31
+ },
+ "id": 37,
+ "panels": [],
+ "repeat": null,
+ "title": "All processes CPU usage",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 3,
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 13,
+ "w": 24,
+ "x": 0,
+ "y": 32
+ },
+ "id": 20,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "sum (rate (container_cpu_usage_seconds_total{id!=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (id)",
+ "hide": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "{{ id }}",
+ "metric": "container_cpu",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "All processes CPU usage (5m avg)",
+ "tooltip": {
+ "msResolution": true,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "cores",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 45
+ },
+ "id": 38,
+ "panels": [],
+ "title": "Pods memory usage",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 24,
+ "x": 0,
+ "y": 46
+ },
+ "id": 25,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sideWidth": 200,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "sum (container_memory_working_set_bytes{image!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) by (pod)",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "{{ pod }}",
+ "metric": "container_memory_usage:sort_desc",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Pods memory usage",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 53
+ },
+ "id": 39,
+ "panels": [],
+ "title": "Containers memory usage",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 24,
+ "x": 0,
+ "y": 54
+ },
+ "id": 27,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sideWidth": 200,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "sum (container_memory_working_set_bytes{image!=\"\",name=~\"^k8s_.*\",container!=\"POD\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) by (container, pod)",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "pod: {{ pod }} | {{ container }}",
+ "metric": "container_memory_usage:sort_desc",
+ "refId": "A",
+ "step": 10
+ },
+ {
+ "expr": "sum (container_memory_working_set_bytes{image!=\"\",name!~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) by (kubernetes_io_hostname, name, image)",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})",
+ "metric": "container_memory_usage:sort_desc",
+ "refId": "B",
+ "step": 10
+ },
+ {
+ "expr": "sum (container_memory_working_set_bytes{rkt_container_name!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) by (kubernetes_io_hostname, rkt_container_name)",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}",
+ "metric": "container_memory_usage:sort_desc",
+ "refId": "C",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Containers memory usage",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 61
+ },
+ "id": 40,
+ "panels": [],
+ "title": "All processes memory usage",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 13,
+ "w": 24,
+ "x": 0,
+ "y": 62
+ },
+ "id": 28,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": true,
+ "sideWidth": 200,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "sum (container_memory_working_set_bytes{id!=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) by (id)",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "{{ id }}",
+ "metric": "container_memory_usage:sort_desc",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "All processes memory usage",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 75
+ },
+ "id": 41,
+ "panels": [],
+ "title": "Pods network I/O",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 24,
+ "x": 0,
+ "y": 76
+ },
+ "id": 16,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sideWidth": 200,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum (rate (container_network_receive_bytes_total{image!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (pod)",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "-> {{ pod }}",
+ "metric": "network",
+ "refId": "A",
+ "step": 10
+ },
+ {
+ "expr": "- sum (rate (container_network_transmit_bytes_total{image!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (pod)",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "<- {{ pod }}",
+ "metric": "network",
+ "refId": "B",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Pods network I/O (5m avg)",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 83
+ },
+ "id": 42,
+ "panels": [],
+ "title": "Containers network I/O",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 24,
+ "x": 0,
+ "y": 84
+ },
+ "id": 30,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sideWidth": 200,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum (rate (container_network_receive_bytes_total{image!=\"\",name=~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (container, pod)",
+ "hide": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "-> pod: {{ pod }} | {{ container }}",
+ "metric": "network",
+ "refId": "B",
+ "step": 10
+ },
+ {
+ "expr": "- sum (rate (container_network_transmit_bytes_total{image!=\"\",name=~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (container, pod)",
+ "hide": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "<- pod: {{ pod }} | {{ container }}",
+ "metric": "network",
+ "refId": "D",
+ "step": 10
+ },
+ {
+ "expr": "sum (rate (container_network_receive_bytes_total{image!=\"\",name!~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (kubernetes_io_hostname, name, image)",
+ "hide": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "-> docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})",
+ "metric": "network",
+ "refId": "A",
+ "step": 10
+ },
+ {
+ "expr": "- sum (rate (container_network_transmit_bytes_total{image!=\"\",name!~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (kubernetes_io_hostname, name, image)",
+ "hide": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "<- docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})",
+ "metric": "network",
+ "refId": "C",
+ "step": 10
+ },
+ {
+ "expr": "sum (rate (container_network_receive_bytes_total{rkt_container_name!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (kubernetes_io_hostname, rkt_container_name)",
+ "hide": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "-> rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}",
+ "metric": "network",
+ "refId": "E",
+ "step": 10
+ },
+ {
+ "expr": "- sum (rate (container_network_transmit_bytes_total{rkt_container_name!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (kubernetes_io_hostname, rkt_container_name)",
+ "hide": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "<- rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}",
+ "metric": "network",
+ "refId": "F",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Containers network I/O (5m avg)",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 91
+ },
+ "id": 43,
+ "panels": [],
+ "title": "All processes network I/O",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 13,
+ "w": 24,
+ "x": 0,
+ "y": 92
+ },
+ "id": 29,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": true,
+ "sideWidth": 200,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum (rate (container_network_receive_bytes_total{id!=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (id)",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "-> {{ id }}",
+ "metric": "network",
+ "refId": "A",
+ "step": 10
+ },
+ {
+ "expr": "- sum (rate (container_network_transmit_bytes_total{id!=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (id)",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "<- {{ id }}",
+ "metric": "network",
+ "refId": "B",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "All processes network I/O (5m avg)",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "5m",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [
+ "kubernetes"
+ ],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": ".+",
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": ".+",
+ "current": {
+ "text": "All",
+ "value": "$__all"
+ },
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(node_uname_info{nc_region=~\"$region\"}, hostname)",
+ "hide": 0,
+ "includeAll": true,
+ "label": "Node",
+ "multi": false,
+ "name": "Node",
+ "options": [],
+ "query": "label_values(node_uname_info{nc_region=~\"$region\"}, hostname)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-5m",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Container Metrics (cAdvisor)",
+ "uid": "container-metrics",
+ "version": 1
+ }
+ coredns: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.3.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": ""
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "A dashboard for the CoreDNS DNS server.",
+ "editable": false,
+ "overwrite": true,
+ "gnetId": 5926,
+ "graphTooltip": 0,
+ "id": 85,
+ "links": [],
+ "panels": [
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 4,
+ "x": 0,
+ "y": 0
+ },
+ "id": 22,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "$$hashKey": "object:956",
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "$$hashKey": "object:957",
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "version",
+ "targets": [
+ {
+ "expr": "coredns_build_info",
+ "format": "table",
+ "instant": true,
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Version",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [],
+ "valueName": "first"
+ },
+ {
+ "datasource": null,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 5
+ },
+ "id": 24,
+ "title": "Row title",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 0,
+ "y": 6
+ },
+ "hiddenSeries": false,
+ "id": 1,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pluginVersion": "7.4.5",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "total",
+ "yaxis": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(coredns_dns_requests_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (proto)",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "sum(rate(coredns_dns_requests_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m]))",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "total",
+ "refId": "B",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Requests (total)",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "pps",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "pps",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 8,
+ "y": 6
+ },
+ "hiddenSeries": false,
+ "id": 12,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pluginVersion": "7.4.5",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "total",
+ "yaxis": 2
+ },
+ {
+ "alias": "other",
+ "yaxis": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(coredns_dns_requests_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (type)",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{type}}",
+ "refId": "A",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Requests (by qtype)",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "pps",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "pps",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 16,
+ "y": 6
+ },
+ "hiddenSeries": false,
+ "id": 2,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pluginVersion": "7.4.5",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "total",
+ "yaxis": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(coredns_dns_requests_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (zone)",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{zone}}",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "sum(rate(coredns_dns_requests_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m]))",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "total",
+ "refId": "B",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Requests (by zone)",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "pps",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "pps",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 13
+ },
+ "hiddenSeries": false,
+ "id": 10,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pluginVersion": "7.4.5",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "total",
+ "yaxis": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(coredns_dns_requests_do_count_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m]))",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "DO",
+ "refId": "A",
+ "step": 40
+ },
+ {
+ "expr": "sum(rate(coredns_dns_requests_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m]))",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "total",
+ "refId": "B",
+ "step": 40
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Requests (DO bit)",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "pps",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "pps",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 12,
+ "y": 13
+ },
+ "hiddenSeries": false,
+ "id": 9,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pluginVersion": "7.4.5",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "tcp:90",
+ "yaxis": 2
+ },
+ {
+ "alias": "tcp:99 ",
+ "yaxis": 2
+ },
+ {
+ "alias": "tcp:50",
+ "yaxis": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\",nc_region=~\"$region\"}[5m])) by (le,proto))",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}:99 ",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\",nc_region=~\"$region\"}[5m])) by (le,proto))",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}:90",
+ "refId": "B",
+ "step": 60
+ },
+ {
+ "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\",nc_region=~\"$region\"}[5m])) by (le,proto))",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}:50",
+ "refId": "C",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Requests (size, udp)",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 18,
+ "y": 13
+ },
+ "hiddenSeries": false,
+ "id": 14,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pluginVersion": "7.4.5",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "tcp:90",
+ "yaxis": 1
+ },
+ {
+ "alias": "tcp:99 ",
+ "yaxis": 1
+ },
+ {
+ "alias": "tcp:50",
+ "yaxis": 1
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\",nc_region=~\"$region\"}[5m])) by (le,proto))",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}:99 ",
+ "refId": "A",
+ "step": 60
+ },
+ {
+ "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\",nc_region=~\"$region\"}[5m])) by (le,proto))",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}:90",
+ "refId": "B",
+ "step": 60
+ },
+ {
+ "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\",nc_region=~\"$region\"}[5m])) by (le,proto))",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}:50",
+ "refId": "C",
+ "step": 60
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Requests (size, tcp)",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 20
+ },
+ "hiddenSeries": false,
+ "id": 5,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pluginVersion": "7.4.5",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(coredns_dns_responses_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (rcode)",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{rcode}}",
+ "refId": "A",
+ "step": 40
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Responses (by rcode)",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "pps",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 20
+ },
+ "hiddenSeries": false,
+ "id": 3,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pluginVersion": "7.4.5",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (le, job))",
+ "intervalFactor": 2,
+ "legendFormat": "99%",
+ "refId": "A",
+ "step": 40
+ },
+ {
+ "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (le))",
+ "intervalFactor": 2,
+ "legendFormat": "90%",
+ "refId": "B",
+ "step": 40
+ },
+ {
+ "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (le))",
+ "intervalFactor": 2,
+ "legendFormat": "50%",
+ "refId": "C",
+ "step": 40
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Responses (duration)",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 27
+ },
+ "hiddenSeries": false,
+ "id": 8,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pluginVersion": "7.4.5",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "udp:50%",
+ "yaxis": 1
+ },
+ {
+ "alias": "tcp:50%",
+ "yaxis": 2
+ },
+ {
+ "alias": "tcp:90%",
+ "yaxis": 2
+ },
+ {
+ "alias": "tcp:99%",
+ "yaxis": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\",nc_region=~\"$region\"}[5m])) by (le,proto)) ",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}:99%",
+ "refId": "A",
+ "step": 40
+ },
+ {
+ "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\",nc_region=~\"$region\"}[5m])) by (le,proto)) ",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}:90%",
+ "refId": "B",
+ "step": 40
+ },
+ {
+ "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\",nc_region=~\"$region\"}[5m])) by (le,proto)) ",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}:50%",
+ "metric": "",
+ "refId": "C",
+ "step": 40
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Responses (size, udp)",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 27
+ },
+ "hiddenSeries": false,
+ "id": 13,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pluginVersion": "7.4.5",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "udp:50%",
+ "yaxis": 1
+ },
+ {
+ "alias": "tcp:50%",
+ "yaxis": 1
+ },
+ {
+ "alias": "tcp:90%",
+ "yaxis": 1
+ },
+ {
+ "alias": "tcp:99%",
+ "yaxis": 1
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\",nc_region=~\"$region\"}[5m])) by (le,proto)) ",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}:99%",
+ "refId": "A",
+ "step": 40
+ },
+ {
+ "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\",nc_region=~\"$region\"}[5m])) by (le,proto)) ",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}:90%",
+ "refId": "B",
+ "step": 40
+ },
+ {
+ "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\",nc_region=~\"$region\"}[5m])) by (le, proto)) ",
+ "intervalFactor": 2,
+ "legendFormat": "{{proto}}:50%",
+ "metric": "",
+ "refId": "C",
+ "step": 40
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Responses (size, tcp)",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 34
+ },
+ "hiddenSeries": false,
+ "id": 15,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pluginVersion": "7.4.5",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(coredns_cache_entries{instance=~\"$instance\",nc_region=~\"$region\"}) by (type)",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{type}}",
+ "refId": "A",
+ "step": 40
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Cache (size)",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 34
+ },
+ "hiddenSeries": false,
+ "id": 16,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pluginVersion": "7.4.5",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "misses",
+ "yaxis": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(coredns_cache_hits_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (type)",
+ "intervalFactor": 2,
+ "legendFormat": "hits:{{type}}",
+ "refId": "A",
+ "step": 40
+ },
+ {
+ "expr": "sum(rate(coredns_cache_misses_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (type)",
+ "intervalFactor": 2,
+ "legendFormat": "misses",
+ "refId": "B",
+ "step": 40
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Cache (hitrate)",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "pps",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "pps",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "schemaVersion": 27,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "selected": false,
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "description": null,
+ "error": null,
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": ".+",
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "description": null,
+ "error": null,
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": {
+ "query": "label_values(nc_region)",
+ "refId": "prometheus-region-Variable-Query"
+ },
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": ".*",
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "description": null,
+ "error": null,
+ "hide": 0,
+ "includeAll": true,
+ "label": "Instance",
+ "multi": false,
+ "name": "instance",
+ "options": [],
+ "query": {
+ "query": "up{job=\"coredns\",nc_region=~\"$region\"}",
+ "refId": "prometheus-instance-Variable-Query"
+ },
+ "refresh": 1,
+ "regex": ".*instance=\"(.*?)\".*",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "now": true,
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "CoreDNS",
+ "uid": "coredns",
+ "version": 4
+ }
+ kubernetes_etcd: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "etcd Grafana dashboard with Prometheus",
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 290,
+ "links": [],
+ "panels": [
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 0,
+ "y": 0
+ },
+ "id": 28,
+ "interval": null,
+ "isNew": true,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(etcd_server_has_leader{job=\"$cluster\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "metric": "etcd_server_has_leader",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": "",
+ "title": "Up",
+ "type": "singlestat",
+ "valueFontSize": "200%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "gridPos": {
+ "h": 7,
+ "w": 10,
+ "x": 6,
+ "y": 0
+ },
+ "id": 23,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(grpc_server_started_total{job=\"$cluster\",grpc_type=\"unary\",nc_region=~\"$region\"}[5m]))",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "RPC Rate",
+ "metric": "grpc_server_started_total",
+ "refId": "A",
+ "step": 2
+ },
+ {
+ "expr": "sum(rate(grpc_server_handled_total{job=\"$cluster\",grpc_type=\"unary\",grpc_code!=\"OK\",nc_region=~\"$region\"}[5m]))",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "RPC Failed Rate",
+ "metric": "grpc_server_handled_total",
+ "refId": "B",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "RPC Rate",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "ops",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 16,
+ "y": 0
+ },
+ "id": 41,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(grpc_server_started_total{job=\"$cluster\",grpc_service=\"etcdserverpb.Watch\",grpc_type=\"bidi_stream\",nc_region=~\"$region\"}) - sum(grpc_server_handled_total{job=\"$cluster\",grpc_service=\"etcdserverpb.Watch\",grpc_type=\"bidi_stream\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Watch Streams",
+ "metric": "grpc_server_handled_total",
+ "refId": "A",
+ "step": 4
+ },
+ {
+ "expr": "sum(grpc_server_started_total{job=\"$cluster\",grpc_service=\"etcdserverpb.Lease\",grpc_type=\"bidi_stream\",nc_region=~\"$region\"}) - sum(grpc_server_handled_total{job=\"$cluster\",grpc_service=\"etcdserverpb.Lease\",grpc_type=\"bidi_stream\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Lease Streams",
+ "metric": "grpc_server_handled_total",
+ "refId": "B",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Active Streams",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": null,
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 0,
+ "y": 7
+ },
+ "id": 1,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "etcd_mvcc_db_total_size_in_bytes{job=\"$cluster\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "hide": false,
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{instance}} DB Size",
+ "metric": "",
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "DB Size",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 8,
+ "y": 7
+ },
+ "id": 3,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 1,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "histogram_quantile(0.99, sum(rate(etcd_disk_wal_fsync_duration_seconds_bucket{job=\"$cluster\",nc_region=~\"$region\"}[5m])) by (instance, le))",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 2,
+ "legendFormat": "{{instance}} WAL fsync",
+ "metric": "etcd_disk_wal_fsync_duration_seconds_bucket",
+ "refId": "A",
+ "step": 4
+ },
+ {
+ "expr": "histogram_quantile(0.99, sum(rate(etcd_disk_backend_commit_duration_seconds_bucket{job=\"$cluster\",nc_region=~\"$region\"}[5m])) by (instance, le))",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{instance}} DB fsync",
+ "metric": "etcd_disk_backend_commit_duration_seconds_bucket",
+ "refId": "B",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Disk Sync Duration",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 16,
+ "y": 7
+ },
+ "id": 29,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "process_resident_memory_bytes{job=\"$cluster\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{instance}} Resident Memory",
+ "metric": "process_resident_memory_bytes",
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Memory",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 5,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 0,
+ "y": 14
+ },
+ "id": 22,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(etcd_network_client_grpc_received_bytes_total{job=\"$cluster\",nc_region=~\"$region\"}[5m])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{instance}} Client Traffic In",
+ "metric": "etcd_network_client_grpc_received_bytes_total",
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Client Traffic In",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 5,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 6,
+ "y": 14
+ },
+ "id": 21,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(etcd_network_client_grpc_sent_bytes_total{job=\"$cluster\",nc_region=~\"$region\"}[5m])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{instance}} Client Traffic Out",
+ "metric": "etcd_network_client_grpc_sent_bytes_total",
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Client Traffic Out",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 12,
+ "y": 14
+ },
+ "id": 20,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(etcd_network_peer_received_bytes_total{job=\"$cluster\",nc_region=~\"$region\"}[5m])) by (instance)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{instance}} Peer Traffic In",
+ "metric": "etcd_network_peer_received_bytes_total",
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Peer Traffic In",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": null,
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 18,
+ "y": 14
+ },
+ "id": 16,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(etcd_network_peer_sent_bytes_total{job=\"$cluster\",nc_region=~\"$region\"}[5m])) by (instance)",
+ "format": "time_series",
+ "hide": false,
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{instance}} Peer Traffic Out",
+ "metric": "etcd_network_peer_sent_bytes_total",
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Peer Traffic Out",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 21
+ },
+ "id": 40,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(etcd_server_proposals_failed_total{job=\"$cluster\",nc_region=~\"$region\"}[5m]))",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Proposal Failure Rate",
+ "metric": "etcd_server_proposals_failed_total",
+ "refId": "A",
+ "step": 2
+ },
+ {
+ "expr": "sum(etcd_server_proposals_pending{job=\"$cluster\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Proposal Pending Total",
+ "metric": "etcd_server_proposals_pending",
+ "refId": "B",
+ "step": 2
+ },
+ {
+ "expr": "sum(rate(etcd_server_proposals_committed_total{job=\"$cluster\",nc_region=~\"$region\"}[5m]))",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Proposal Commit Rate",
+ "metric": "etcd_server_proposals_committed_total",
+ "refId": "C",
+ "step": 2
+ },
+ {
+ "expr": "sum(rate(etcd_server_proposals_applied_total{job=\"$cluster\",nc_region=~\"$region\"}[5m]))",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Proposal Apply Rate",
+ "refId": "D",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Raft Proposals",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 21
+ },
+ "id": 19,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": false,
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "changes(etcd_server_leader_changes_seen_total{job=\"$cluster\",nc_region=~\"$region\"}[1d])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{instance}} Total Leader Elections Per Day",
+ "metric": "etcd_server_leader_changes_seen_total",
+ "refId": "A",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Total Leader Elections Per Day",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "1m",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 1,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(etcd_server_has_leader{nc_region=~\"$region\"}, job)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "cluster",
+ "multi": false,
+ "name": "cluster",
+ "options": [],
+ "query": "label_values(etcd_server_has_leader{nc_region=~\"$region\"}, job)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 2,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "now": true,
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Kubernetes etcd",
+ "uid": "kubernetes-etcd",
+ "version": 5
+ }
+ kubernetes_cluster_status: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": ""
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 218,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 11,
+ "panels": [],
+ "repeat": null,
+ "title": "Cluster Health",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 6,
+ "x": 0,
+ "y": 1
+ },
+ "id": 5,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(up{job=~\"apiserver|kube-scheduler|kube-controller-manager\",nc_region=~\"$region\"} == 0)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 600
+ }
+ ],
+ "thresholds": "1,3",
+ "title": "Control Plane UP",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "UP",
+ "value": "null"
+ }
+ ],
+ "valueName": "total"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 6,
+ "x": 6,
+ "y": 1
+ },
+ "id": 6,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(ALERTS{alertstate=\"firing\",alertname!=\"DeadMansSwitch\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 600
+ }
+ ],
+ "thresholds": "3,5",
+ "title": "Alerts Firing",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "0",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": null,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 6,
+ "x": 12,
+ "y": 1
+ },
+ "hideTimeOverride": false,
+ "id": 4,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "count(increase(kube_pod_container_status_restarts_total{nc_region=~\"$region\"}[1h]) > 5)",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 600
+ }
+ ],
+ "thresholds": "1,3",
+ "title": "Crashlooping Control Plane Pods",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "0",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": null,
+ "format": "percent",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 6,
+ "x": 18,
+ "y": 1
+ },
+ "id": 1,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "(sum(up{job=\"apiserver\",nc_region=~\"$region\"} == 1) / count(up{job=\"apiserver\",nc_region=~\"$region\"})) * 100",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 600
+ }
+ ],
+ "thresholds": "50,80",
+ "title": "API Servers UP",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 5
+ },
+ "id": 13,
+ "panels": [],
+ "repeat": null,
+ "title": "Capacity Planning",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "percent",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 6,
+ "x": 0,
+ "y": 6
+ },
+ "id": 8,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(100 - (avg by (instance) (rate(node_cpu_seconds_total{job=\"node-exporter\",mode=\"idle\"}[5m])) * 100)) / count(node_cpu_seconds_total{job=\"node-exporter\",mode=\"idle\"})",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 600
+ }
+ ],
+ "thresholds": "80,90",
+ "title": "CPU Utilization",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "percent",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 6,
+ "x": 6,
+ "y": 6
+ },
+ "id": 7,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "((sum(node_memory_MemTotal_bytes) - sum(node_memory_MemFree_bytes) - sum(node_memory_Buffers_bytes) - sum(node_memory_Cached_bytes)) / sum(node_memory_MemTotal_bytes)) * 100",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 600
+ }
+ ],
+ "thresholds": "80,90",
+ "title": "Memory Utilization",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "percent",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 6,
+ "x": 12,
+ "y": 6
+ },
+ "id": 9,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "((sum(node_filesystem_size_bytes{device!=\"rootfs\",nc_region=~\"$region\"}) - sum(node_filesystem_free_bytes{device!=\"rootfs\",nc_region=~\"$region\"})) / sum(node_filesystem_size_bytes{device!=\"rootfs\",nc_region=~\"$region\"})) * 100",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 600
+ }
+ ],
+ "thresholds": "80,90",
+ "title": "Filesystem Utilization",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "percent",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 6,
+ "x": 18,
+ "y": 6
+ },
+ "id": 10,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "100 - (sum(kube_node_status_capacity{resource=\"pods\"}) by (nc_region) - sum(kube_pod_info) by (nc_region))/ sum(kube_node_status_capacity{resource=\"pods\"}) by (nc_region)* 100",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 600
+ }
+ ],
+ "thresholds": "80,90",
+ "title": "Pod Utilization",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "fill": 1,
+ "gridPos": {
+ "h": 6,
+ "w": 6,
+ "x": 0,
+ "y": 11
+ },
+ "id": 17,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(kube_node_status_capacity{resource=\"cpu\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "capacity",
+ "refId": "A"
+ },
+ {
+ "expr": "sum(kube_node_status_allocatable{resource=\"cpu\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "allocatable",
+ "refId": "B"
+ },
+ {
+ "expr": "sum(kube_pod_container_resource_requests{resource=\"cpu\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "requested",
+ "refId": "C"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Cluster CPU Capacity",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": null,
+ "format": "none",
+ "label": "cores",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "fill": 1,
+ "gridPos": {
+ "h": 6,
+ "w": 6,
+ "x": 6,
+ "y": 11
+ },
+ "id": 19,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(kube_node_status_allocatable{resource=\"memory\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "allocatable",
+ "refId": "A"
+ },
+ {
+ "expr": "sum(kube_node_status_capacity{resource=\"memory\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "capacity",
+ "refId": "B"
+ },
+ {
+ "expr": "sum(kube_pod_container_resource_requests{resource=\"memory\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "requested",
+ "refId": "C"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Cluster Mem Capacity",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "fill": 1,
+ "gridPos": {
+ "h": 6,
+ "w": 6,
+ "x": 12,
+ "y": 11
+ },
+ "id": 21,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(node_filesystem_size_bytes{nc_region=~\"$region\"}) - sum(node_filesystem_free_bytes{nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "usage",
+ "refId": "A"
+ },
+ {
+ "expr": "sum(node_filesystem_size_bytes{nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "limit",
+ "refId": "B"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Cluster Disk Capacity",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "fill": 1,
+ "gridPos": {
+ "h": 6,
+ "w": 6,
+ "x": 18,
+ "y": 11
+ },
+ "id": 15,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(kube_node_status_allocatable{resource=\"pods\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "allocatable",
+ "refId": "A"
+ },
+ {
+ "expr": "sum(kube_node_status_capacity{resource=\"pods\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "capacity",
+ "refId": "B"
+ },
+ {
+ "expr": "sum(kube_pod_info)",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "requested",
+ "refId": "C"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Cluster Pod Capacity",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "pods",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 17
+ },
+ "id": 37,
+ "panels": [],
+ "title": "Nodes",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 8,
+ "x": 0,
+ "y": 18
+ },
+ "id": 35,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_node_info)",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Number Of Nodes",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 8,
+ "x": 8,
+ "y": 18
+ },
+ "id": 39,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_node_status_condition{nc_region=~\"$region\", condition=\"OutOfDisk\", status=\"true\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1",
+ "title": "Nodes Out of Disk",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 8,
+ "x": 16,
+ "y": 18
+ },
+ "id": 41,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_node_spec_unschedulable{nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1",
+ "title": "Nodes Unavailable",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 21
+ },
+ "id": 25,
+ "panels": [],
+ "title": "Pods",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 5,
+ "x": 0,
+ "y": 22
+ },
+ "id": 23,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(78, 203, 42, 0.28)",
+ "full": false,
+ "lineColor": "#629e51",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_pod_status_phase{nc_region=~\"$region\", phase=\"Running\"})",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Pods Running",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 5,
+ "x": 5,
+ "y": 22
+ },
+ "id": 27,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(78, 203, 42, 0.28)",
+ "full": false,
+ "lineColor": "#629e51",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_pod_status_phase{nc_region=~\"$region\", phase=\"Pending\"})",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Pods Pending",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 5,
+ "x": 10,
+ "y": 22
+ },
+ "id": 29,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(78, 203, 42, 0.28)",
+ "full": false,
+ "lineColor": "#629e51",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_pod_status_phase{nc_region=~\"$region\", phase=\"Failed\"})",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Pods Failed",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 5,
+ "x": 15,
+ "y": 22
+ },
+ "id": 31,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(78, 203, 42, 0.28)",
+ "full": false,
+ "lineColor": "#629e51",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_pod_status_phase{nc_region=~\"$region\", phase=\"Succeeded\"})",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Pods Succeeded",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 4,
+ "x": 20,
+ "y": 22
+ },
+ "id": 33,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(78, 203, 42, 0.28)",
+ "full": false,
+ "lineColor": "#629e51",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_pod_status_phase{nc_region=~\"$region\", phase=\"Unknown\"})",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Pods Unknown",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 27
+ },
+ "id": 45,
+ "panels": [],
+ "title": "Containers",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 6,
+ "x": 0,
+ "y": 28
+ },
+ "id": 43,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_pod_container_status_running{nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Containers Running",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 6,
+ "x": 6,
+ "y": 28
+ },
+ "id": 47,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_pod_container_status_waiting{nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Containers Waiting",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 6,
+ "x": 12,
+ "y": 28
+ },
+ "id": 49,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_pod_container_status_terminated{nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Containers Terminated",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 6,
+ "x": 18,
+ "y": 28
+ },
+ "id": 51,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(delta(kube_pod_container_status_restarts_total{namespace!=\"kube-system\", nc_region=~\"$region\"}[30m]))",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Containers Restarts (Last 30 Minutes)",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 12,
+ "x": 0,
+ "y": 32
+ },
+ "id": 53,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_pod_container_resource_requests{resource=\"cpu\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "CPU Cores Requested by Containers",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "decbytes",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 12,
+ "x": 12,
+ "y": 32
+ },
+ "id": 55,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_pod_container_resource_requests{resource=\"memory\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Memory Requested By Containers",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 36
+ },
+ "id": 59,
+ "panels": [],
+ "title": "Jobs",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 8,
+ "x": 0,
+ "y": 37
+ },
+ "id": 57,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_job_status_succeeded{nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Jobs Succeeded",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 8,
+ "x": 8,
+ "y": 37
+ },
+ "id": 61,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_job_status_active{nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Jobs Active",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "prometheus",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 8,
+ "x": 16,
+ "y": 37
+ },
+ "id": 63,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(kube_job_status_failed{nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Jobs Failed",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ }
+ ],
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": ".+",
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Kubernetes Cluster Status",
+ "uid": "kubernetes-cluster-status",
+ "version": 3
+ }
+ nginx_stats: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": "5.0.0"
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "table",
+ "name": "Table",
+ "version": "5.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ },
+ {
+ "datasource": "${DS_PROMETHEUS}",
+ "enable": true,
+ "expr": "sum(changes(nginx_ingress_controller_config_last_reload_successful_timestamp_seconds{instance!=\"unknown\",controller_class=~\"$controller_class\",service_namespace=~\"$namespace\",nc_region=~\"$region\"}[30s])) by (controller_class)",
+ "hide": false,
+ "iconColor": "rgba(255, 96, 96, 1)",
+ "limit": 100,
+ "name": "Config Reloads",
+ "showIn": 0,
+ "step": "30s",
+ "tagKeys": "controller_class",
+ "tags": [],
+ "titleFormat": "Config Reloaded",
+ "type": "tags"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 191,
+ "links": [],
+ "panels": [
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "ops",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "id": 20,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "round(sum(irate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",service_namespace=~\"$namespace\",nc_region=~\"$region\"}[2m])), 0.001)",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": "",
+ "title": "Controller Request Volume",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 6,
+ "x": 6,
+ "y": 0
+ },
+ "id": 82,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(avg_over_time(nginx_ingress_controller_nginx_process_connections{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"}[2m]))",
+ "format": "time_series",
+ "instant": false,
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": "",
+ "title": "Controller Connections",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "percentunit",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 80,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": false
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 6,
+ "x": 12,
+ "y": 0
+ },
+ "id": 21,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(rate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",service_namespace=~\"$namespace\",status!~\"[4-5].*\",nc_region=~\"$region\"}[2m])) / sum(rate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",service_namespace=~\"$namespace\",nc_region=~\"$region\"}[2m]))",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": "95, 99, 99.5",
+ "title": "Controller Success Rate (non-4|5xx responses)",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 3,
+ "x": 18,
+ "y": 0
+ },
+ "id": 81,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "avg(nginx_ingress_controller_success{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "instant": true,
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": "",
+ "title": "Config Reloads",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 3,
+ "x": 21,
+ "y": 0
+ },
+ "id": 83,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "count(nginx_ingress_controller_config_last_reload_successful{controller_pod=~\"$controller\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"} == 0)",
+ "format": "time_series",
+ "instant": true,
+ "intervalFactor": 1,
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": "",
+ "title": "Last Config Failed",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 3
+ },
+ "height": "200px",
+ "id": 86,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": false,
+ "hideEmpty": false,
+ "hideZero": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sideWidth": 300,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "repeat": null,
+ "repeatDirection": "h",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "round(sum(irate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (ingress), 0.001)",
+ "format": "time_series",
+ "hide": false,
+ "instant": false,
+ "interval": "",
+ "intervalFactor": 1,
+ "legendFormat": "{{ ingress }}",
+ "metric": "network",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Ingress Request Volume",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "max - istio-proxy": "#890f02",
+ "max - master": "#bf1b00",
+ "max - prometheus": "#bf1b00"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": false,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 3
+ },
+ "id": 87,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": false,
+ "hideEmpty": true,
+ "hideZero": false,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sideWidth": 300,
+ "sort": "avg",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",service_namespace=~\"$namespace\",ingress=~\"$ingress\",status!~\"[4-5].*\",nc_region=~\"$region\"}[2m])) by (ingress) / sum(rate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",service_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (ingress)",
+ "format": "time_series",
+ "instant": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "{{ ingress }}",
+ "metric": "container_memory_usage:sort_desc",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Ingress Success Rate (non-4|5xx responses)",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 1,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "percentunit",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 6,
+ "w": 8,
+ "x": 0,
+ "y": 10
+ },
+ "height": "200px",
+ "id": 32,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": false,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": false,
+ "sideWidth": 200,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum (irate (nginx_ingress_controller_request_size_sum{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"}[2m]))",
+ "format": "time_series",
+ "instant": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "Received",
+ "metric": "network",
+ "refId": "A",
+ "step": 10
+ },
+ {
+ "expr": "- sum (irate (nginx_ingress_controller_response_size_sum{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"}[2m]))",
+ "format": "time_series",
+ "hide": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "Sent",
+ "metric": "network",
+ "refId": "B",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Network I/O pressure",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "max - istio-proxy": "#890f02",
+ "max - master": "#bf1b00",
+ "max - prometheus": "#bf1b00"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": false,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 6,
+ "w": 8,
+ "x": 8,
+ "y": 10
+ },
+ "id": 77,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": false,
+ "sideWidth": 200,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "avg(nginx_ingress_controller_nginx_process_resident_memory_bytes{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"}) ",
+ "format": "time_series",
+ "instant": false,
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "nginx",
+ "metric": "container_memory_usage:sort_desc",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Average Memory Usage",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "max - istio-proxy": "#890f02",
+ "max - master": "#bf1b00"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 3,
+ "editable": false,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 6,
+ "w": 8,
+ "x": 16,
+ "y": 10
+ },
+ "height": "",
+ "id": 79,
+ "isNew": true,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": false,
+ "sort": null,
+ "sortDesc": null,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum (rate (nginx_ingress_controller_nginx_process_cpu_seconds_total{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"}[2m])) ",
+ "format": "time_series",
+ "interval": "10s",
+ "intervalFactor": 1,
+ "legendFormat": "nginx",
+ "metric": "container_cpu",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [
+ {
+ "colorMode": "critical",
+ "fill": true,
+ "line": true,
+ "op": "gt"
+ }
+ ],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Average CPU Usage",
+ "tooltip": {
+ "msResolution": true,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "cores",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "columns": [],
+ "datasource": "${DS_PROMETHEUS}",
+ "fontSize": "100%",
+ "gridPos": {
+ "h": 8,
+ "w": 24,
+ "x": 0,
+ "y": 16
+ },
+ "hideTimeOverride": false,
+ "id": 75,
+ "links": [],
+ "options": {},
+ "pageSize": 7,
+ "repeat": null,
+ "repeatDirection": "h",
+ "scroll": true,
+ "showHeader": true,
+ "sort": {
+ "col": 1,
+ "desc": true
+ },
+ "styles": [
+ {
+ "alias": "Ingress",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 2,
+ "pattern": "ingress",
+ "preserveFormat": false,
+ "sanitize": false,
+ "thresholds": [],
+ "type": "string",
+ "unit": "short"
+ },
+ {
+ "alias": "Requests",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 2,
+ "pattern": "Value #A",
+ "thresholds": [
+ ""
+ ],
+ "type": "number",
+ "unit": "ops"
+ },
+ {
+ "alias": "Errors",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 2,
+ "pattern": "Value #B",
+ "thresholds": [],
+ "type": "number",
+ "unit": "ops"
+ },
+ {
+ "alias": "P50 Latency",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 0,
+ "link": false,
+ "pattern": "Value #C",
+ "thresholds": [],
+ "type": "number",
+ "unit": "dtdurations"
+ },
+ {
+ "alias": "P90 Latency",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 0,
+ "pattern": "Value #D",
+ "thresholds": [],
+ "type": "number",
+ "unit": "dtdurations"
+ },
+ {
+ "alias": "P99 Latency",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 0,
+ "pattern": "Value #E",
+ "thresholds": [],
+ "type": "number",
+ "unit": "dtdurations"
+ },
+ {
+ "alias": "IN",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 2,
+ "pattern": "Value #F",
+ "thresholds": [
+ ""
+ ],
+ "type": "number",
+ "unit": "Bps"
+ },
+ {
+ "alias": "",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 2,
+ "pattern": "Time",
+ "thresholds": [],
+ "type": "hidden",
+ "unit": "short"
+ },
+ {
+ "alias": "OUT",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 2,
+ "mappingType": 1,
+ "pattern": "Value #G",
+ "thresholds": [],
+ "type": "number",
+ "unit": "Bps"
+ }
+ ],
+ "targets": [
+ {
+ "expr": "histogram_quantile(0.50, sum(rate(nginx_ingress_controller_request_duration_seconds_bucket{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (le, ingress))",
+ "format": "table",
+ "hide": false,
+ "instant": true,
+ "intervalFactor": 1,
+ "legendFormat": "{{ ingress }}",
+ "refId": "C"
+ },
+ {
+ "expr": "histogram_quantile(0.90, sum(rate(nginx_ingress_controller_request_duration_seconds_bucket{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (le, ingress))",
+ "format": "table",
+ "hide": false,
+ "instant": true,
+ "intervalFactor": 1,
+ "legendFormat": "{{ ingress }}",
+ "refId": "D"
+ },
+ {
+ "expr": "histogram_quantile(0.99, sum(rate(nginx_ingress_controller_request_duration_seconds_bucket{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (le, ingress))",
+ "format": "table",
+ "hide": false,
+ "instant": true,
+ "intervalFactor": 1,
+ "legendFormat": "{{ ingress }}",
+ "refId": "E"
+ },
+ {
+ "expr": "sum(irate(nginx_ingress_controller_request_size_sum{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (ingress)",
+ "format": "table",
+ "hide": false,
+ "instant": true,
+ "interval": "",
+ "intervalFactor": 1,
+ "legendFormat": "{{ ingress }}",
+ "refId": "F"
+ },
+ {
+ "expr": "sum(irate(nginx_ingress_controller_response_size_sum{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (ingress)",
+ "format": "table",
+ "instant": true,
+ "intervalFactor": 1,
+ "legendFormat": "{{ ingress }}",
+ "refId": "G"
+ }
+ ],
+ "timeFrom": null,
+ "title": "Ingress Percentile Response Times and Transfer Rates",
+ "transform": "table",
+ "type": "table"
+ },
+ {
+ "columns": [
+ {
+ "text": "Current",
+ "value": "current"
+ }
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "fontSize": "100%",
+ "gridPos": {
+ "h": 8,
+ "w": 24,
+ "x": 0,
+ "y": 24
+ },
+ "height": "1024",
+ "id": 85,
+ "links": [],
+ "options": {},
+ "pageSize": 7,
+ "scroll": true,
+ "showHeader": true,
+ "sort": {
+ "col": 1,
+ "desc": false
+ },
+ "styles": [
+ {
+ "alias": "Time",
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "pattern": "Time",
+ "type": "date"
+ },
+ {
+ "alias": "TTL",
+ "colorMode": "cell",
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 0,
+ "pattern": "Current",
+ "thresholds": [
+ "0",
+ "691200"
+ ],
+ "type": "number",
+ "unit": "s"
+ },
+ {
+ "alias": "",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "decimals": 2,
+ "pattern": "/.*/",
+ "thresholds": [],
+ "type": "number",
+ "unit": "short"
+ }
+ ],
+ "targets": [
+ {
+ "expr": "avg(nginx_ingress_controller_ssl_expire_time_seconds{pod=~\"$controller\",service_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}) by (host) - time()",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{ host }}",
+ "metric": "gke_letsencrypt_cert_expiration",
+ "refId": "A",
+ "step": 1
+ }
+ ],
+ "title": "Ingress Certificate Expiry",
+ "transform": "timeseries_aggregations",
+ "type": "table"
+ }
+ ],
+ "refresh": "5s",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [
+ "nginx"
+ ],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": ".*",
+ "current": {
+ "text": "All",
+ "value": "$__all"
+ },
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nginx_ingress_controller_config_hash{nc_region=~\"$region\"}, controller_namespace)",
+ "hide": 0,
+ "includeAll": true,
+ "label": "Namespace",
+ "multi": false,
+ "name": "namespace",
+ "options": [],
+ "query": "label_values(nginx_ingress_controller_config_hash{nc_region=~\"$region\"}, controller_namespace)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": ".*",
+ "current": {
+ "text": "All",
+ "value": "$__all"
+ },
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": true,
+ "label": "Controller Class",
+ "multi": false,
+ "name": "controller_class",
+ "options": [],
+ "query": "label_values(nginx_ingress_controller_config_hash{service_namespace=~\"$namespace\",nc_region=~\"$region\"}, controller_class) ",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": ".*",
+ "current": {
+ "text": "All",
+ "value": "$__all"
+ },
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": true,
+ "label": "Controller",
+ "multi": false,
+ "name": "controller",
+ "options": [],
+ "query": "label_values(nginx_ingress_controller_config_hash{service_namespace=~\"$namespace\",controller_class=~\"$controller_class\",nc_region=~\"$region\"}, controller_pod) ",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": ".*",
+ "current": {
+ "text": "All",
+ "value": "$__all"
+ },
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "label_values(nginx_ingress_controller_requests{service_namespace=~\"$namespace\",controller_class=~\"$controller_class\",controller=~\"$controller\",nc_region=~\"$region\"}, ingress) ",
+ "hide": 0,
+ "includeAll": true,
+ "label": "Ingress",
+ "multi": false,
+ "name": "ingress",
+ "options": [],
+ "query": "label_values(nginx_ingress_controller_requests{service_namespace=~\"$namespace\",controller_class=~\"$controller_class\",controller=~\"$controller\",nc_region=~\"$region\"}, ingress) ",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 2,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "2m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "NGINX Ingress controller",
+ "uid": "nginx",
+ "version": 3
+ }
+ persistent-volume: |-
+ {
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 119,
+ "links": [],
+ "panels": [
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "fill": 1,
+ "gridPos": {
+ "h": 9,
+ "w": 18,
+ "x": 0,
+ "y": 0
+ },
+ "id": 2,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": true,
+ "min": true,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "(sum without(instance, node) (kubelet_volume_stats_capacity_bytes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"}) - sum without(instance, node) (kubelet_volume_stats_available_bytes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"}))",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Used Space ",
+ "refId": "A"
+ },
+ {
+ "expr": "sum without(instance, node) (kubelet_volume_stats_available_bytes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Free Space",
+ "refId": "B"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Volume Space Usage",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "datasource": "prometheus",
+ "gridPos": {
+ "h": 9,
+ "w": 6,
+ "x": 18,
+ "y": 0
+ },
+ "id": 5,
+ "links": [],
+ "options": {
+ "fieldOptions": {
+ "calcs": [
+ "mean"
+ ],
+ "defaults": {
+ "max": 100,
+ "min": 0,
+ "unit": "percent"
+ },
+ "mappings": [
+ {
+ "from": "",
+ "id": 1,
+ "operator": "",
+ "text": "",
+ "to": "",
+ "type": 1,
+ "value": ""
+ }
+ ],
+ "override": {},
+ "thresholds": [
+ {
+ "color": "green",
+ "index": 0,
+ "value": null
+ },
+ {
+ "color": "red",
+ "index": 1,
+ "value": 80
+ }
+ ],
+ "values": false
+ },
+ "orientation": "auto",
+ "showThresholdLabels": true,
+ "showThresholdMarkers": true
+ },
+ "pluginVersion": "6.2.0",
+ "targets": [
+ {
+ "expr": "(kubelet_volume_stats_capacity_bytes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"} - kubelet_volume_stats_available_bytes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"}) / kubelet_volume_stats_capacity_bytes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"} * 100",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A"
+ }
+ ],
+ "timeFrom": null,
+ "timeShift": null,
+ "title": "Volume Space Usage",
+ "type": "gauge"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "fill": 1,
+ "gridPos": {
+ "h": 9,
+ "w": 18,
+ "x": 0,
+ "y": 9
+ },
+ "id": 3,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": true,
+ "min": true,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum without(instance, node) (kubelet_volume_stats_inodes_used{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Used inodes",
+ "refId": "A"
+ },
+ {
+ "expr": "(\n sum without(instance, node) (kubelet_volume_stats_inodes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"})\n -\n sum without(instance, node) (kubelet_volume_stats_inodes_used{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"})\n)",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{nc_region}} Free inodes",
+ "refId": "B"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Volume inode Usage",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "datasource": "prometheus",
+ "gridPos": {
+ "h": 9,
+ "w": 6,
+ "x": 18,
+ "y": 9
+ },
+ "id": 6,
+ "links": [],
+ "options": {
+ "fieldOptions": {
+ "calcs": [
+ "mean"
+ ],
+ "defaults": {
+ "max": 100,
+ "min": 0,
+ "unit": "percent"
+ },
+ "mappings": [
+ {
+ "from": "",
+ "id": 1,
+ "operator": "",
+ "text": "",
+ "to": "",
+ "type": 1,
+ "value": ""
+ }
+ ],
+ "override": {},
+ "thresholds": [
+ {
+ "color": "green",
+ "index": 0,
+ "value": null
+ },
+ {
+ "color": "red",
+ "index": 1,
+ "value": 80
+ }
+ ],
+ "values": false
+ },
+ "orientation": "auto",
+ "showThresholdLabels": true,
+ "showThresholdMarkers": true
+ },
+ "pluginVersion": "6.2.0",
+ "targets": [
+ {
+ "expr": "kubelet_volume_stats_inodes_used{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"} / kubelet_volume_stats_inodes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"} * 100",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A"
+ }
+ ],
+ "timeFrom": null,
+ "timeShift": null,
+ "title": "Volume inode Usage",
+ "type": "gauge"
+ }
+ ],
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(kubelet_volume_stats_capacity_bytes{ job=\"kubelet\", nc_region=\"$region\"}, namespace)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Namespace",
+ "multi": false,
+ "name": "namespace",
+ "options": [],
+ "query": "label_values(kubelet_volume_stats_capacity_bytes{ job=\"kubelet\", nc_region=\"$region\"}, namespace)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(kubelet_volume_stats_capacity_bytes{ job=\"kubelet\", namespace=\"$namespace\"}, persistentvolumeclaim)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "PersistentVolumeClaim",
+ "multi": false,
+ "name": "volume",
+ "options": [],
+ "query": "label_values(kubelet_volume_stats_capacity_bytes{ job=\"kubelet\", namespace=\"$namespace\"}, persistentvolumeclaim)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Kubernetes Persistent Volume",
+ "uid": "persistent-volume",
+ "version": 1
+ }
+ elasticsearch: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": ""
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "Elasticsearch detailed dashboard",
+ "editable": false,
+ "overwrite": true,
+ "gnetId": 4358,
+ "graphTooltip": 1,
+ "id": 206,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 50,
+ "panels": [],
+ "repeat": null,
+ "title": "Cluster",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "#FADE2A",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 10,
+ "x": 0,
+ "y": 1
+ },
+ "height": "50",
+ "id": 8,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "(sum(elasticsearch_cluster_health_status{cluster=~\"$region\",color=\"green\",nc_region=~\"$region\"})*2)+sum(elasticsearch_cluster_health_status{cluster=~\"$region\",color=\"yellow\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 3,
+ "legendFormat": "",
+ "metric": "",
+ "refId": "A",
+ "step": 40
+ }
+ ],
+ "thresholds": "0,2",
+ "title": "Cluster health status",
+ "type": "singlestat",
+ "valueFontSize": "110%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "GREEN",
+ "value": "2"
+ },
+ {
+ "op": "=",
+ "text": "YELLOW",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "RED",
+ "value": "0"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 10,
+ "y": 1
+ },
+ "height": "50",
+ "id": 10,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(elasticsearch_cluster_health_number_of_nodes{cluster=~\"$region\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "metric": "",
+ "refId": "A",
+ "step": 40
+ }
+ ],
+ "thresholds": "",
+ "title": "Nodes",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 14,
+ "y": 1
+ },
+ "height": "50",
+ "id": 9,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "elasticsearch_cluster_health_number_of_data_nodes{cluster=\"$region\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "metric": "",
+ "refId": "A",
+ "step": 40
+ }
+ ],
+ "thresholds": "",
+ "title": "Data nodes",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 6,
+ "x": 18,
+ "y": 1
+ },
+ "height": "50",
+ "hideTimeOverride": true,
+ "id": 16,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "elasticsearch_cluster_health_number_of_pending_tasks{cluster=\"$region\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "metric": "",
+ "refId": "A",
+ "step": 40
+ }
+ ],
+ "thresholds": "",
+ "title": "Pending tasks",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 4
+ },
+ "id": 51,
+ "panels": [],
+ "repeat": null,
+ "title": "Shards",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 0,
+ "y": 5
+ },
+ "height": "50",
+ "id": 11,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "maxPerRow": 6,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "repeat": "shard_type",
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "elasticsearch_cluster_health_active_primary_shards{cluster=\"$region\",nc_region=~\"$region\"}",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 40
+ }
+ ],
+ "thresholds": "",
+ "title": "active primary shards",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 4,
+ "y": 5
+ },
+ "height": "50",
+ "id": 39,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "maxPerRow": 6,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "elasticsearch_cluster_health_active_shards{cluster=\"$region\",nc_region=~\"$region\"}",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 40
+ }
+ ],
+ "thresholds": "",
+ "title": "active shards",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 8,
+ "y": 5
+ },
+ "height": "50",
+ "id": 40,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "maxPerRow": 6,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "elasticsearch_cluster_health_initializing_shards{cluster=\"$region\",nc_region=~\"$region\"}",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 40
+ }
+ ],
+ "thresholds": "",
+ "title": "initializing shards",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 12,
+ "y": 5
+ },
+ "height": "50",
+ "id": 41,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "maxPerRow": 6,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "elasticsearch_cluster_health_relocating_shards{cluster=\"$region\",nc_region=~\"$region\"}",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 40
+ }
+ ],
+ "thresholds": "",
+ "title": "relocating shards",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 4,
+ "x": 16,
+ "y": 5
+ },
+ "height": "50",
+ "id": 42,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "maxPerRow": 6,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "elasticsearch_cluster_health_unassigned_shards{cluster=\"$region\",nc_region=~\"$region\"}",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 40
+ }
+ ],
+ "thresholds": "",
+ "title": "unassigned shards",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 8
+ },
+ "id": 52,
+ "panels": [],
+ "repeat": null,
+ "title": "System",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 6,
+ "x": 0,
+ "y": 9
+ },
+ "height": "400",
+ "id": 30,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "elasticsearch_os_cpu_percent{cluster=\"$region\",es_master_node=\"true\",name=~\"$node\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "instant": false,
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - master",
+ "metric": "",
+ "refId": "A",
+ "step": 10
+ },
+ {
+ "expr": "elasticsearch_os_cpu_percent{cluster=\"$region\",es_data_node=\"true\",name=~\"$node\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - data",
+ "metric": "",
+ "refId": "B",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "CPU usage",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "percent",
+ "label": "CPU usage",
+ "logBase": 1,
+ "max": 100,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 6,
+ "x": 6,
+ "y": 9
+ },
+ "height": "400",
+ "id": 31,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "elasticsearch_jvm_memory_used_bytes{cluster=\"$region\",name=~\"$node\",name=~\"$node\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - used: {{area}}",
+ "metric": "",
+ "refId": "A",
+ "step": 10
+ },
+ {
+ "expr": "elasticsearch_jvm_memory_committed_bytes{cluster=\"$region\",name=~\"$node\",name=~\"$node\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - committed: {{area}}",
+ "refId": "B",
+ "step": 10
+ },
+ {
+ "expr": "elasticsearch_jvm_memory_max_bytes{cluster=\"$region\",name=~\"$node\",name=~\"$node\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - max: {{area}}",
+ "refId": "C",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "JVM memory usage",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": "Memory",
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 6,
+ "x": 12,
+ "y": 9
+ },
+ "height": "400",
+ "id": 32,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "1-(elasticsearch_filesystem_data_available_bytes{cluster=\"$region\",nc_region=~\"$region\"}/elasticsearch_filesystem_data_size_bytes{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - {{path}}",
+ "metric": "",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [
+ {
+ "colorMode": "custom",
+ "fill": true,
+ "fillColor": "rgba(216, 200, 27, 0.27)",
+ "op": "gt",
+ "value": 0.8
+ },
+ {
+ "colorMode": "custom",
+ "fill": true,
+ "fillColor": "rgba(234, 112, 112, 0.22)",
+ "op": "gt",
+ "value": 0.9
+ }
+ ],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Disk usage",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "percentunit",
+ "label": "Disk Usage %",
+ "logBase": 1,
+ "max": 1,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 6,
+ "x": 18,
+ "y": 9
+ },
+ "height": "400",
+ "id": 47,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "sort": "max",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "sent",
+ "transform": "negative-Y"
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "irate(elasticsearch_transport_tx_size_bytes_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - sent",
+ "refId": "D",
+ "step": 10
+ },
+ {
+ "expr": "irate(elasticsearch_transport_rx_size_bytes_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - received",
+ "refId": "C",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Network usage",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": "Bytes/sec",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "pps",
+ "label": "",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 19
+ },
+ "id": 53,
+ "panels": [],
+ "repeat": null,
+ "title": "Documents",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 6,
+ "x": 0,
+ "y": 20
+ },
+ "height": "400",
+ "id": 1,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "elasticsearch_indices_docs{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }}",
+ "metric": "",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Documents count",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "Documents",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 6,
+ "x": 6,
+ "y": 20
+ },
+ "height": "400",
+ "id": 24,
+ "interval": "",
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(elasticsearch_indices_indexing_index_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}}",
+ "metric": "",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Documents indexed rate",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "index calls/s",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 6,
+ "x": 12,
+ "y": 20
+ },
+ "height": "400",
+ "id": 25,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(elasticsearch_indices_docs_deleted{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}}",
+ "metric": "",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Documents deleted rate",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "Documents/s",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 6,
+ "x": 18,
+ "y": 20
+ },
+ "height": "400",
+ "id": 26,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(elasticsearch_indices_merges_docs_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}}",
+ "metric": "",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Documents merged rate",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "Documents/s",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 30
+ },
+ "id": 54,
+ "panels": [],
+ "repeat": null,
+ "title": "Total Operations stats",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 12,
+ "x": 0,
+ "y": 31
+ },
+ "height": "400",
+ "id": 48,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "sort": "avg",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "irate(elasticsearch_indices_indexing_index_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - indexing",
+ "metric": "",
+ "refId": "A",
+ "step": 4
+ },
+ {
+ "expr": "irate(elasticsearch_indices_search_query_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - query",
+ "refId": "B",
+ "step": 4
+ },
+ {
+ "expr": "irate(elasticsearch_indices_search_fetch_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - fetch",
+ "refId": "C",
+ "step": 4
+ },
+ {
+ "expr": "irate(elasticsearch_indices_merges_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - merges",
+ "refId": "D",
+ "step": 4
+ },
+ {
+ "expr": "irate(elasticsearch_indices_refresh_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - refresh",
+ "refId": "E",
+ "step": 4
+ },
+ {
+ "expr": "irate(elasticsearch_indices_flush_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - flush",
+ "refId": "F",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Total Operations rate",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "Operations/s",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 12,
+ "x": 12,
+ "y": 31
+ },
+ "height": "400",
+ "id": 49,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "sort": "avg",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "irate(elasticsearch_indices_indexing_index_time_seconds_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - indexing",
+ "metric": "",
+ "refId": "A",
+ "step": 4
+ },
+ {
+ "expr": "irate(elasticsearch_indices_search_query_time_ms_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - query",
+ "refId": "B",
+ "step": 4
+ },
+ {
+ "expr": "irate(elasticsearch_indices_search_fetch_time_ms_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - fetch",
+ "refId": "C",
+ "step": 4
+ },
+ {
+ "expr": "irate(elasticsearch_indices_merges_total_time_ms_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - merges",
+ "refId": "D",
+ "step": 4
+ },
+ {
+ "expr": "irate(elasticsearch_indices_refresh_total_time_ms_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - refresh",
+ "refId": "E",
+ "step": 4
+ },
+ {
+ "expr": "irate(elasticsearch_indices_flush_time_ms_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ name }} - flush",
+ "refId": "F",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Total Operations time",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "ms",
+ "label": "Time",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 41
+ },
+ "id": 55,
+ "panels": [],
+ "repeat": null,
+ "title": "Times",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 8,
+ "x": 0,
+ "y": 42
+ },
+ "height": "400",
+ "id": 33,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(elasticsearch_indices_search_query_time_seconds{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval]) ",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}}",
+ "metric": "",
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Query time",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": "Time",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 8,
+ "x": 8,
+ "y": 42
+ },
+ "height": "400",
+ "id": 5,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(elasticsearch_indices_indexing_index_time_seconds_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}}",
+ "metric": "",
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Indexing time",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": "Time",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 8,
+ "x": 16,
+ "y": 42
+ },
+ "height": "400",
+ "id": 3,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(elasticsearch_indices_merges_total_time_seconds_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}}",
+ "metric": "",
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Merging time",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": "Time",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 52
+ },
+ "id": 56,
+ "panels": [],
+ "repeat": null,
+ "title": "Caches",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 6,
+ "x": 0,
+ "y": 53
+ },
+ "height": "400",
+ "id": 4,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "elasticsearch_indices_fielddata_memory_size_bytes{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}}",
+ "metric": "",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Field data memory size",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": "Memory",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 6,
+ "x": 6,
+ "y": 53
+ },
+ "height": "400",
+ "id": 34,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(elasticsearch_indices_fielddata_evictions{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}}",
+ "metric": "",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Field data evictions",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "Evictions/s",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 6,
+ "x": 12,
+ "y": 53
+ },
+ "height": "400",
+ "id": 35,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "elasticsearch_indices_query_cache_memory_size_bytes{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}}",
+ "metric": "",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Query cache size",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": "Size",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 6,
+ "x": 18,
+ "y": 53
+ },
+ "height": "400",
+ "id": 36,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(elasticsearch_indices_query_cache_evictions{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}}",
+ "metric": "",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Query cache evictions",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "Evictions/s",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 63
+ },
+ "id": 57,
+ "panels": [],
+ "repeat": null,
+ "title": "Thread Pool",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 19,
+ "w": 6,
+ "x": 0,
+ "y": 64
+ },
+ "id": 45,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": false,
+ "max": true,
+ "min": true,
+ "show": true,
+ "sort": "avg",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": " irate(elasticsearch_thread_pool_rejected_count{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}} - {{ type }}",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Thread Pool operations rejected",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 19,
+ "w": 6,
+ "x": 6,
+ "y": 64
+ },
+ "id": 46,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": false,
+ "max": true,
+ "min": true,
+ "show": true,
+ "sort": "avg",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "elasticsearch_thread_pool_queue_count{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}} - {{ type }}",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Thread Pool operations queued",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 19,
+ "w": 6,
+ "x": 12,
+ "y": 64
+ },
+ "height": "",
+ "id": 43,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": false,
+ "max": true,
+ "min": true,
+ "show": true,
+ "sort": "avg",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "elasticsearch_thread_pool_active_count{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}} - {{ type }}",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Thread Pool threads active",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 19,
+ "w": 6,
+ "x": 18,
+ "y": 64
+ },
+ "id": 44,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": false,
+ "max": true,
+ "min": true,
+ "show": true,
+ "sort": "avg",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "irate(elasticsearch_thread_pool_completed_count{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}} - {{ type }}",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Thread Pool operations completed",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 83
+ },
+ "id": 58,
+ "panels": [],
+ "repeat": null,
+ "title": "JVM Garbage Collection",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 12,
+ "x": 0,
+ "y": 84
+ },
+ "height": "400",
+ "id": 7,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(elasticsearch_jvm_gc_collection_seconds_count{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}} - {{gc}}",
+ "metric": "",
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "GC count",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "GCs",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 10,
+ "w": 12,
+ "x": 12,
+ "y": 84
+ },
+ "height": "400",
+ "id": 27,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": true,
+ "min": true,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(elasticsearch_jvm_gc_collection_seconds_sum{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}} - {{gc}}",
+ "metric": "",
+ "refId": "A",
+ "step": 4
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "GC time",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": "Time",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "30s",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [
+ "elasticsearch",
+ "App"
+ ],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": ".+",
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {
+ "text": "All",
+ "value": [
+ "$__all"
+ ]
+ },
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(elasticsearch_process_cpu_percent{nc_region=~\"$region\"},name)",
+ "hide": 0,
+ "includeAll": true,
+ "label": "Node",
+ "multi": true,
+ "name": "node",
+ "options": [],
+ "query": "label_values(elasticsearch_process_cpu_percent{nc_region=~\"$region\"},name)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 1,
+ "tagValuesQuery": null,
+ "tags": [],
+ "tagsQuery": null,
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "auto": true,
+ "auto_count": 30,
+ "auto_min": "10s",
+ "current": {
+ "text": "1h",
+ "value": "1h"
+ },
+ "hide": 0,
+ "label": "Interval",
+ "name": "interval",
+ "options": [
+ {
+ "selected": false,
+ "text": "auto",
+ "value": "$__auto_interval_interval"
+ },
+ {
+ "selected": false,
+ "text": "1m",
+ "value": "1m"
+ },
+ {
+ "selected": false,
+ "text": "10m",
+ "value": "10m"
+ },
+ {
+ "selected": false,
+ "text": "30m",
+ "value": "30m"
+ },
+ {
+ "selected": true,
+ "text": "1h",
+ "value": "1h"
+ },
+ {
+ "selected": false,
+ "text": "6h",
+ "value": "6h"
+ },
+ {
+ "selected": false,
+ "text": "12h",
+ "value": "12h"
+ },
+ {
+ "selected": false,
+ "text": "1d",
+ "value": "1d"
+ },
+ {
+ "selected": false,
+ "text": "7d",
+ "value": "7d"
+ },
+ {
+ "selected": false,
+ "text": "14d",
+ "value": "14d"
+ },
+ {
+ "selected": false,
+ "text": "30d",
+ "value": "30d"
+ }
+ ],
+ "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d",
+ "refresh": 2,
+ "skipUrlSync": false,
+ "type": "interval"
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Elasticsearch",
+ "uid": "elasticsearch",
+ "version": 8
+ }
+ fluentd: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 182,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 29,
+ "panels": [],
+ "title": "Buffer Overview",
+ "type": "row"
+ },
+ {
+ "columns": [],
+ "datasource": "${DS_PROMETHEUS}",
+ "fontSize": "100%",
+ "gridPos": {
+ "h": 20,
+ "w": 12,
+ "x": 0,
+ "y": 1
+ },
+ "id": 27,
+ "links": [],
+ "options": {},
+ "pageSize": null,
+ "pluginVersion": "6.2.0",
+ "scroll": true,
+ "showHeader": true,
+ "sort": {
+ "col": 1,
+ "desc": false
+ },
+ "styles": [
+ {
+ "alias": "Time",
+ "colorMode": null,
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 2,
+ "mappingType": 1,
+ "pattern": "Time",
+ "thresholds": [],
+ "type": "hidden",
+ "unit": "short"
+ },
+ {
+ "alias": "local_elasticsearch",
+ "colorMode": "value",
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 0,
+ "mappingType": 1,
+ "pattern": "Value #A",
+ "thresholds": [
+ "50",
+ "90"
+ ],
+ "type": "number",
+ "unit": "short"
+ },
+ {
+ "alias": "centralized_logging",
+ "colorMode": "value",
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 0,
+ "mappingType": 1,
+ "pattern": "Value #B",
+ "thresholds": [
+ "50",
+ "90"
+ ],
+ "type": "number",
+ "unit": "short"
+ },
+ {
+ "alias": "dmaap",
+ "colorMode": "value",
+ "colors": [
+ "rgba(245, 54, 54, 0.9)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(50, 172, 45, 0.97)"
+ ],
+ "dateFormat": "YYYY-MM-DD HH:mm:ss",
+ "decimals": 0,
+ "mappingType": 1,
+ "pattern": "Value #C",
+ "thresholds": [
+ "50",
+ "90"
+ ],
+ "type": "number",
+ "unit": "short"
+ }
+ ],
+ "targets": [
+ {
+ "expr": "sum by (node) (fluentd_output_status_buffer_available_space_ratio{plugin_id=\"local_elasticsearch_output\",node=~\"$node\",nc_region=~\"$region\"})",
+ "format": "table",
+ "instant": true,
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A"
+ },
+ {
+ "expr": "sum by (node) (fluentd_output_status_buffer_available_space_ratio{plugin_id=\"centralized_logging_output\",node=~\"$node\",nc_region=~\"$region\"})",
+ "format": "table",
+ "hide": false,
+ "instant": true,
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "B"
+ },
+ {
+ "expr": "sum by (node) (fluentd_output_status_buffer_available_space_ratio{plugin_id=\"dmaap_output\",node=~\"$node\",nc_region=~\"$region\"})",
+ "format": "table",
+ "hide": false,
+ "instant": true,
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "C"
+ }
+ ],
+ "timeFrom": null,
+ "timeShift": null,
+ "title": "Remaining Buffer Space Available (%)",
+ "transform": "table",
+ "type": "table"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 1,
+ "fill": 0,
+ "gridPos": {
+ "h": 10,
+ "w": 12,
+ "x": 12,
+ "y": 1
+ },
+ "id": 23,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum by (node) (fluentd_output_status_buffer_queue_length{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Chunks Queued for $destination",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": 0,
+ "format": "short",
+ "label": "Chunks in Buffer",
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "description": "",
+ "fill": 0,
+ "gridPos": {
+ "h": 10,
+ "w": 12,
+ "x": 12,
+ "y": 11
+ },
+ "id": 34,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum by (node) (rate(fluentd_output_status_flush_time_count{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"}[5m]))",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Time to Send a Chunk to $destination",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": 0,
+ "format": "ms",
+ "label": "Flush Time",
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "fill": 0,
+ "gridPos": {
+ "h": 10,
+ "w": 12,
+ "x": 0,
+ "y": 21
+ },
+ "id": 25,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "avg by (node) (fluentd_output_status_buffer_total_bytes{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Queue Size for $destination",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": 2,
+ "format": "decbytes",
+ "label": "",
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "description": "",
+ "fill": 0,
+ "gridPos": {
+ "h": 10,
+ "w": 12,
+ "x": 12,
+ "y": 21
+ },
+ "id": 36,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum by (node) (rate(fluentd_output_status_write_count{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"}[5m]))",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Chunks Sent per Second to $destination",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": 2,
+ "format": "short",
+ "label": "Chunks Sent per Second",
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "fill": 0,
+ "gridPos": {
+ "h": 7,
+ "w": 24,
+ "x": 0,
+ "y": 31
+ },
+ "id": 22,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": false,
+ "min": true,
+ "rightSide": true,
+ "show": true,
+ "sort": "current",
+ "sortDesc": false,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "avg by (node, plugin_id) (fluentd_output_status_buffer_available_space_ratio{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Remaining Buffer Space % for $destination",
+ "tooltip": {
+ "shared": true,
+ "sort": 1,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": 0,
+ "format": "short",
+ "label": "Remaining Buffer Space (%)",
+ "logBase": 1,
+ "max": "100",
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 38
+ },
+ "id": 31,
+ "panels": [],
+ "title": "Errors and Retries",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "cacheTimeout": null,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "fill": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 8,
+ "x": 0,
+ "y": 39
+ },
+ "id": 24,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum by (node) (rate(fluentd_output_status_num_errors{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"}[2m]))",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Output Error Rate for $destination",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": 2,
+ "format": "short",
+ "label": "Errors Per Second",
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "cacheTimeout": null,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "fill": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 8,
+ "x": 8,
+ "y": 39
+ },
+ "id": 35,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum by (node) (rate(fluentd_output_status_retry_count{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"}[2m]))",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Output Retry Rate for $destination",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": 2,
+ "format": "short",
+ "label": "Retries Per Second",
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "cacheTimeout": null,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "fill": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 8,
+ "x": 16,
+ "y": 39
+ },
+ "id": 37,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum by (node) (rate(fluentd_output_status_slow_flush_count{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"}[2m]))",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Slow Flushes to $destination",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": 2,
+ "format": "short",
+ "label": "Slow Flushes",
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 47
+ },
+ "id": 15,
+ "panels": [],
+ "title": "Input / Output Statistics",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "fill": 0,
+ "gridPos": {
+ "h": 9,
+ "w": 12,
+ "x": 0,
+ "y": 48
+ },
+ "id": 12,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum by ($aggregator) (rate(fluentd_read_count{node=~\"$node\",nc_region=~\"$region\"}[2m]))",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{$aggregator}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Message Input Rate by $aggregator on Node(s): $node",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": 1,
+ "format": "short",
+ "label": "Lines Read Per Second",
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "fill": 0,
+ "gridPos": {
+ "h": 9,
+ "w": 12,
+ "x": 12,
+ "y": 48
+ },
+ "id": 13,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum by ($aggregator) (rate([[destination]]_output_count{node=~\"$node\",nc_region=~\"$region\"}[2m]))",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{$aggregator}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Output Queuing Rate by $aggregator on Node(s): $node for $destination",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": 1,
+ "format": "short",
+ "label": "Lines Queued Per Second",
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "30s",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [
+ "fluentd"
+ ],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": ".+",
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": ".*",
+ "current": {
+ "text": "All",
+ "value": [
+ "$__all"
+ ]
+ },
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(fluentd_read_count{nc_region=~\"$region\"},node)",
+ "hide": 0,
+ "includeAll": true,
+ "label": "Node",
+ "multi": true,
+ "name": "node",
+ "options": [],
+ "query": "label_values(fluentd_read_count{nc_region=~\"$region\"},node)",
+ "refresh": 1,
+ "regex": ".*r[\\d]{2}[co]{1}[\\d]{3}",
+ "skipUrlSync": false,
+ "sort": 1,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {
+ "text": "local_elasticsearch",
+ "value": "local_elasticsearch"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Output Buffer",
+ "multi": false,
+ "name": "destination",
+ "options": [
+ {
+ "selected": true,
+ "text": "local_elasticsearch",
+ "value": "local_elasticsearch"
+ },
+ {
+ "selected": false,
+ "text": "centralized_logging",
+ "value": "centralized_logging"
+ },
+ {
+ "selected": false,
+ "text": "dmaap",
+ "value": "dmaap"
+ }
+ ],
+ "query": "local_elasticsearch,centralized_logging,dmaap",
+ "skipUrlSync": false,
+ "type": "custom"
+ },
+ {
+ "allValue": null,
+ "current": {
+ "text": "tag",
+ "value": "tag"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Group I/O Rate by Label",
+ "multi": false,
+ "name": "aggregator",
+ "options": [
+ {
+ "selected": false,
+ "text": "node",
+ "value": "node"
+ },
+ {
+ "selected": false,
+ "text": "region",
+ "value": "region"
+ },
+ {
+ "selected": false,
+ "text": "node_fqdn",
+ "value": "node_fqdn"
+ },
+ {
+ "selected": true,
+ "text": "tag",
+ "value": "tag"
+ },
+ {
+ "selected": false,
+ "text": "index_prefix",
+ "value": "index_prefix"
+ }
+ ],
+ "query": "node,region,node_fqdn,tag,index_prefix",
+ "skipUrlSync": false,
+ "type": "custom"
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Fluentd",
+ "uid": "fluentd",
+ "version": 2
+ }
+ idrac: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "Dashboard to get an overview of one server",
+ "editable": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 95,
+ "iteration": 1644114779535,
+ "links": [],
+ "panels": [
+ {
+ "cacheTimeout": null,
+ "datasource": "${DS_PROMETHEUS}",
+ "fieldConfig": {
+ "defaults": {
+ "color": {
+ "mode": "thresholds"
+ },
+ "mappings": [
+ {
+ "id": 0,
+ "op": "=",
+ "text": "N/A",
+ "type": 1,
+ "value": "null"
+ },
+ {
+ "id": 1,
+ "op": "=",
+ "text": "Not Synchronized",
+ "type": 1,
+ "value": "0"
+ },
+ {
+ "id": 2,
+ "op": "=",
+ "text": "OK",
+ "type": 1,
+ "value": "1"
+ }
+ ],
+ "thresholds": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "#d44a3a",
+ "value": null
+ },
+ {
+ "color": "rgba(237, 129, 40, 0.89)",
+ "value": 0
+ },
+ {
+ "color": "#299c46",
+ "value": 1
+ }
+ ]
+ },
+ "unit": "none"
+ },
+ "overrides": []
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 6,
+ "x": 0,
+ "y": 0
+ },
+ "id": 20,
+ "interval": null,
+ "links": [],
+ "maxDataPoints": 100,
+ "options": {
+ "colorMode": "value",
+ "graphMode": "none",
+ "justifyMode": "auto",
+ "orientation": "horizontal",
+ "reduceOptions": {
+ "calcs": [
+ "lastNotNull"
+ ],
+ "fields": "",
+ "values": false
+ },
+ "text": {},
+ "textMode": "auto"
+ },
+ "pluginVersion": "7.5.11",
+ "targets": [
+ {
+ "expr": "idrac_licensestatus_ok{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A"
+ }
+ ],
+ "title": "iDRAC License Status for $node",
+ "transformations": [
+ {
+ "id": "reduce",
+ "options": {
+ "reducers": [
+ "lastNotNull"
+ ]
+ }
+ }
+ ],
+ "type": "stat"
+ },
+ {
+ "datasource": "${DS_PROMETHEUS}",
+ "fieldConfig": {
+ "defaults": {
+ "color": {
+ "mode": "thresholds"
+ },
+ "custom": {
+ "align": "center",
+ "displayMode": "color-background",
+ "filterable": false
+ },
+ "mappings": [],
+ "thresholds": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "rgb(37, 48, 34)",
+ "value": null
+ },
+ {
+ "color": "rgb(206, 14, 36)",
+ "value": 0
+ },
+ {
+ "color": "#EAB839",
+ "value": 480
+ },
+ {
+ "color": "light-green",
+ "value": 840
+ }
+ ]
+ }
+ },
+ "overrides": []
+ },
+ "gridPos": {
+ "h": 8,
+ "w": 6,
+ "x": 6,
+ "y": 0
+ },
+ "id": 41,
+ "options": {
+ "showHeader": false
+ },
+ "pluginVersion": "7.5.11",
+ "targets": [
+ {
+ "expr": "idrac_sensors_tachometer{name=~\"System_Board_Fan[0-9]+\",nc_region=\"$region\",node=\"$node\"}",
+ "format": "table",
+ "interval": "",
+ "legendFormat": "{{name}}",
+ "queryType": "randomWalk",
+ "refId": "A"
+ }
+ ],
+ "title": "System fan for $node",
+ "transformations": [
+ {
+ "id": "filterFieldsByName",
+ "options": {
+ "include": {
+ "names": [
+ "name",
+ "Value"
+ ]
+ }
+ }
+ },
+ {
+ "id": "groupBy",
+ "options": {
+ "fields": {
+ "Value": {
+ "aggregations": [
+ "mean"
+ ],
+ "operation": "aggregate"
+ },
+ "name": {
+ "aggregations": [],
+ "operation": "groupby"
+ }
+ }
+ }
+ }
+ ],
+ "type": "table"
+ },
+ {
+ "cacheTimeout": null,
+ "datasource": "${DS_PROMETHEUS}",
+ "fieldConfig": {
+ "defaults": {
+ "color": {
+ "mode": "thresholds"
+ },
+ "mappings": [
+ {
+ "id": 0,
+ "op": "=",
+ "text": "N/A",
+ "type": 1,
+ "value": "null"
+ }
+ ],
+ "max": 60,
+ "min": 0,
+ "thresholds": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "rgba(50, 172, 45, 0.97)",
+ "value": null
+ },
+ {
+ "color": "rgba(237, 129, 40, 0.89)",
+ "value": 43
+ },
+ {
+ "color": "rgba(245, 54, 54, 0.9)",
+ "value": 47
+ }
+ ]
+ },
+ "unit": "celsius"
+ },
+ "overrides": []
+ },
+ "gridPos": {
+ "h": 8,
+ "w": 6,
+ "x": 12,
+ "y": 0
+ },
+ "id": 32,
+ "interval": null,
+ "links": [],
+ "maxDataPoints": 100,
+ "options": {
+ "orientation": "horizontal",
+ "reduceOptions": {
+ "calcs": [
+ "lastNotNull"
+ ],
+ "fields": "",
+ "values": false
+ },
+ "showThresholdLabels": true,
+ "showThresholdMarkers": true,
+ "text": {}
+ },
+ "pluginVersion": "7.5.11",
+ "targets": [
+ {
+ "expr": "idrac_inlet_temp_in_celsius{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60,
+ "target": ""
+ }
+ ],
+ "title": "Inlet temperature of $node",
+ "transformations": [
+ {
+ "id": "reduce",
+ "options": {
+ "reducers": [
+ "lastNotNull"
+ ]
+ }
+ }
+ ],
+ "type": "gauge"
+ },
+ {
+ "cacheTimeout": null,
+ "datasource": "${DS_PROMETHEUS}",
+ "fieldConfig": {
+ "defaults": {
+ "color": {
+ "mode": "thresholds"
+ },
+ "mappings": [
+ {
+ "id": 0,
+ "op": "=",
+ "text": "N/A",
+ "type": 1,
+ "value": "null"
+ }
+ ],
+ "max": 100,
+ "min": 0,
+ "thresholds": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "rgba(50, 172, 45, 0.97)",
+ "value": null
+ },
+ {
+ "color": "rgba(237, 129, 40, 0.89)",
+ "value": 75
+ },
+ {
+ "color": "rgba(245, 54, 54, 0.9)",
+ "value": 80
+ }
+ ]
+ },
+ "unit": "celsius"
+ },
+ "overrides": []
+ },
+ "gridPos": {
+ "h": 8,
+ "w": 6,
+ "x": 18,
+ "y": 0
+ },
+ "id": 7,
+ "interval": null,
+ "links": [],
+ "maxDataPoints": 100,
+ "options": {
+ "orientation": "horizontal",
+ "reduceOptions": {
+ "calcs": [
+ "lastNotNull"
+ ],
+ "fields": "",
+ "values": false
+ },
+ "showThresholdLabels": true,
+ "showThresholdMarkers": true,
+ "text": {}
+ },
+ "pluginVersion": "7.5.11",
+ "targets": [
+ {
+ "expr": "idrac_exhaust_temp_in_celsius{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60,
+ "target": ""
+ }
+ ],
+ "title": "Exhaust temperature of $node",
+ "transformations": [
+ {
+ "id": "reduce",
+ "options": {
+ "reducers": [
+ "lastNotNull"
+ ]
+ }
+ }
+ ],
+ "type": "gauge"
+ },
+ {
+ "datasource": "${DS_PROMETHEUS}",
+ "fieldConfig": {
+ "defaults": {
+ "color": {
+ "mode": "palette-classic"
+ },
+ "custom": {
+ "align": "center",
+ "displayMode": "auto",
+ "filterable": false
+ },
+ "mappings": [],
+ "thresholds": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "rgb(0, 0, 0)",
+ "value": null
+ }
+ ]
+ }
+ },
+ "overrides": []
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 6,
+ "x": 0,
+ "y": 4
+ },
+ "id": 45,
+ "interval": null,
+ "options": {
+ "showHeader": true
+ },
+ "pluginVersion": "7.5.11",
+ "targets": [
+ {
+ "exemplar": true,
+ "expr": "idrac_sensors_volts{name=~\"PS[0-9]+_Voltage_[0-9]+\",nc_region=\"$region\",node=\"$node\"}",
+ "format": "table",
+ "interval": "",
+ "legendFormat": "{{name}}",
+ "queryType": "randomWalk",
+ "refId": "A"
+ }
+ ],
+ "title": "Power supply for $node",
+ "transformations": [
+ {
+ "id": "filterFieldsByName",
+ "options": {
+ "include": {
+ "names": [
+ "name",
+ "health_state"
+ ]
+ }
+ }
+ },
+ {
+ "id": "organize",
+ "options": {
+ "excludeByName": {},
+ "indexByName": {
+ "health_state": 1,
+ "name": 0
+ },
+ "renameByName": {
+ "health_state": "Health Status",
+ "name": "Name"
+ }
+ }
+ },
+ {
+ "id": "groupBy",
+ "options": {
+ "fields": {
+ "Health Status": {
+ "aggregations": [
+ "last"
+ ],
+ "operation": "aggregate"
+ },
+ "Name": {
+ "aggregations": [],
+ "operation": "groupby"
+ }
+ }
+ }
+ }
+ ],
+ "type": "table"
+ },
+ {
+ "collapsed": false,
+ "datasource": null,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 8
+ },
+ "id": 38,
+ "panels": [],
+ "title": "Selected node metric",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fieldConfig": {
+ "defaults": {
+ "unit": "volt"
+ },
+ "overrides": [
+ {
+ "matcher": {
+ "id": "byName",
+ "options": "node_memory_SwapFree{instance=\"$server\",job=\"prometheus\"}"
+ },
+ "properties": [
+ {
+ "id": "unit",
+ "value": "short"
+ }
+ ]
+ }
+ ]
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 7,
+ "w": 23,
+ "x": 0,
+ "y": 9
+ },
+ "hiddenSeries": false,
+ "id": 33,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "7.5.11",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "idrac_sensors_volts{name=~\"PS[0-9]+_Voltage_[0-9]+\",nc_region=\"$region\",node=\"$node\"}",
+ "format": "time_series",
+ "hide": false,
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "{{name}}",
+ "metric": "",
+ "refId": "C",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Power supply for $node",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:1686",
+ "format": "volt",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "90",
+ "show": true
+ },
+ {
+ "$$hashKey": "object:1687",
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "datasource": "${DS_PROMETHEUS}",
+ "fieldConfig": {
+ "defaults": {
+ "color": {
+ "mode": "palette-classic"
+ },
+ "custom": {
+ "axisLabel": "",
+ "axisPlacement": "auto",
+ "barAlignment": 0,
+ "drawStyle": "line",
+ "fillOpacity": 13,
+ "gradientMode": "opacity",
+ "hideFrom": {
+ "graph": false,
+ "legend": false,
+ "tooltip": false
+ },
+ "lineInterpolation": "linear",
+ "lineStyle": {
+ "fill": "solid"
+ },
+ "lineWidth": 2,
+ "pointSize": 6,
+ "scaleDistribution": {
+ "type": "linear"
+ },
+ "showPoints": "auto",
+ "spanNulls": false
+ },
+ "mappings": [],
+ "min": 0,
+ "thresholds": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "green",
+ "value": null
+ },
+ {
+ "color": "red",
+ "value": 80
+ }
+ ]
+ },
+ "unit": "celsius"
+ },
+ "overrides": [
+ {
+ "matcher": {
+ "id": "byName",
+ "options": "node_memory_SwapFree{instance=\"$server\",job=\"prometheus\"}"
+ },
+ "properties": [
+ {
+ "id": "unit",
+ "value": "short"
+ }
+ ]
+ }
+ ]
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 23,
+ "x": 0,
+ "y": 16
+ },
+ "id": 4,
+ "links": [],
+ "options": {
+ "graph": {},
+ "legend": {
+ "calcs": [],
+ "displayMode": "list",
+ "placement": "bottom"
+ },
+ "tooltipOptions": {
+ "mode": "single"
+ }
+ },
+ "pluginVersion": "7.4.5",
+ "targets": [
+ {
+ "expr": "idrac_inlet_temp_in_celsius{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "hide": false,
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "inlet temp",
+ "metric": "",
+ "refId": "C",
+ "step": 10
+ },
+ {
+ "expr": "idrac_exhaust_temp_in_celsius{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "exhaust temp",
+ "metric": "",
+ "refId": "E",
+ "step": 10
+ }
+ ],
+ "timeFrom": null,
+ "timeShift": null,
+ "title": "Temperature for $node",
+ "type": "timeseries"
+ },
+ {
+ "alerting": {},
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fieldConfig": {
+ "defaults": {
+ "unit": "rotrpm"
+ },
+ "overrides": []
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 8,
+ "w": 23,
+ "x": 0,
+ "y": 23
+ },
+ "hiddenSeries": false,
+ "id": 3,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "7.5.11",
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "idrac_sensors_tachometer{nc_region=\"$region\",node=\"$node\",name=~\"System_Board_Fan[0-9]+\"}",
+ "format": "time_series",
+ "hide": false,
+ "interval": "",
+ "intervalFactor": 10,
+ "legendFormat": "{{name}}",
+ "refId": "A",
+ "step": 50
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Fan speed for $node",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:2909",
+ "format": "rotrpm",
+ "label": "Fan speed",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "$$hashKey": "object:2910",
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "datasource": null,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 31
+ },
+ "id": 14,
+ "panels": [],
+ "title": "All Node iDrac metrics",
+ "type": "row"
+ },
+ {
+ "datasource": "${DS_PROMETHEUS}",
+ "fieldConfig": {
+ "defaults": {
+ "color": {
+ "mode": "thresholds"
+ },
+ "custom": {
+ "align": "center",
+ "displayMode": "color-background",
+ "filterable": true
+ },
+ "mappings": [
+ {
+ "from": "",
+ "id": 1,
+ "text": "OK",
+ "to": "",
+ "type": 1,
+ "value": "1"
+ },
+ {
+ "from": "",
+ "id": 2,
+ "text": "EXPIRED",
+ "to": "",
+ "type": 1,
+ "value": "0"
+ }
+ ],
+ "thresholds": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "rgb(37, 48, 34)",
+ "value": null
+ },
+ {
+ "color": "semi-dark-red",
+ "value": 0
+ },
+ {
+ "color": "light-green",
+ "value": 1
+ }
+ ]
+ }
+ },
+ "overrides": []
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 24,
+ "x": 0,
+ "y": 32
+ },
+ "id": 36,
+ "options": {
+ "showHeader": true,
+ "sortBy": []
+ },
+ "pluginVersion": "7.5.11",
+ "targets": [
+ {
+ "exemplar": true,
+ "expr": "idrac_licensestatus_ok{nc_region=\"$region\"}",
+ "format": "table",
+ "instant": false,
+ "interval": "",
+ "legendFormat": "",
+ "queryType": "randomWalk",
+ "refId": "A"
+ }
+ ],
+ "timeFrom": "1d",
+ "title": "License status per Node",
+ "transformations": [
+ {
+ "id": "filterFieldsByName",
+ "options": {
+ "include": {
+ "names": [
+ "node",
+ "Value #A",
+ "name"
+ ]
+ }
+ }
+ },
+ {
+ "id": "organize",
+ "options": {
+ "excludeByName": {},
+ "indexByName": {},
+ "renameByName": {
+ "Value #A": "Status",
+ "name": "License Name",
+ "node": "Node"
+ }
+ }
+ },
+ {
+ "id": "groupBy",
+ "options": {
+ "fields": {
+ "License Name": {
+ "aggregations": [
+ "last"
+ ],
+ "operation": "aggregate"
+ },
+ "Node": {
+ "aggregations": [],
+ "operation": "groupby"
+ },
+ "Status": {
+ "aggregations": [
+ "last"
+ ],
+ "operation": "aggregate"
+ }
+ }
+ }
+ }
+ ],
+ "type": "table"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "$DS_PROMETHEUS",
+ "fieldConfig": {
+ "defaults": {
+ "unit": "celsius"
+ },
+ "overrides": []
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 10,
+ "w": 24,
+ "x": 0,
+ "y": 39
+ },
+ "hiddenSeries": false,
+ "id": 12,
+ "interval": "",
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": false,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "maxPerRow": 2,
+ "nullPointMode": "null",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "7.5.11",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "repeat": null,
+ "repeatDirection": "h",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "idrac_inlet_temp_in_celsius{nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": "1w",
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Inlet temperature of all nodes in $region",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:2130",
+ "format": "celsius",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "$$hashKey": "object:2131",
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "$DS_PROMETHEUS",
+ "fieldConfig": {
+ "defaults": {
+ "unit": "celsius"
+ },
+ "overrides": []
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 10,
+ "w": 24,
+ "x": 0,
+ "y": 49
+ },
+ "hiddenSeries": false,
+ "id": 43,
+ "interval": "",
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": false,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "maxPerRow": 2,
+ "nullPointMode": "null",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "7.5.11",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "repeatDirection": "h",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "idrac_exhaust_temp_in_celsius{nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": "1w",
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Exhaust temperature of all nodes in $region",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:2130",
+ "format": "celsius",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "$$hashKey": "object:2131",
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "$DS_PROMETHEUS",
+ "fieldConfig": {
+ "defaults": {
+ "unit": "volt"
+ },
+ "overrides": []
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 10,
+ "w": 24,
+ "x": 0,
+ "y": 59
+ },
+ "hiddenSeries": false,
+ "id": 42,
+ "interval": "",
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": false,
+ "hideEmpty": true,
+ "hideZero": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "maxPerRow": 2,
+ "nullPointMode": "null",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "7.5.11",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "repeatDirection": "h",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "exemplar": true,
+ "expr": "idrac_sensors_volts{name=~\"PS[0-9]+_Voltage_[0-9]+\",nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}} {{name}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": "1w",
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Power supply of all nodes in $region",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:2130",
+ "format": "volt",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "$$hashKey": "object:2131",
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "$DS_PROMETHEUS",
+ "fieldConfig": {
+ "defaults": {
+ "unit": "rotrpm"
+ },
+ "overrides": []
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 10,
+ "w": 24,
+ "x": 0,
+ "y": 69
+ },
+ "hiddenSeries": false,
+ "id": 44,
+ "interval": "",
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": false,
+ "hideEmpty": true,
+ "hideZero": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "maxPerRow": 2,
+ "nullPointMode": "null",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "7.5.11",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "repeatDirection": "h",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "exemplar": true,
+ "expr": "idrac_sensors_tachometer{nc_region=\"$region\",name=~\"System_Board_Fan[0-9]+\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}} {{name}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": "1w",
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Fan speed of all nodes in $region",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:2130",
+ "format": "rotrpm",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "$$hashKey": "object:2131",
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": false,
+ "schemaVersion": 27,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "selected": false,
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "description": null,
+ "error": null,
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "queryValue": "",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "description": null,
+ "error": null,
+ "hide": 0,
+ "includeAll": false,
+ "label": "Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": {
+ "query": "label_values(nc_region)",
+ "refId": "prometheus-region-Variable-Query"
+ },
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "label_values(node_uname_info{nc_region=\"$region\"}, node)",
+ "description": null,
+ "error": null,
+ "hide": 0,
+ "includeAll": false,
+ "label": "Node",
+ "multi": false,
+ "name": "node",
+ "options": [],
+ "query": {
+ "query": "label_values(node_uname_info{nc_region=\"$region\"}, node)",
+ "refId": "prometheus-node-Variable-Query"
+ },
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "IDRAC",
+ "uid": "7AovVvank",
+ "version": 1
+ }
+ named_processes: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": ""
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "Process metrics exported by https://github.com/ncabatoff/process-exporter.",
+ "editable": false,
+ "gnetId": 249,
+ "graphTooltip": 1,
+ "id": 77,
+ "links": [
+ {
+ "asDropdown": true,
+ "icon": "external link",
+ "includeVars": true,
+ "keepTime": true,
+ "tags": [
+ "OS"
+ ],
+ "title": "OS",
+ "type": "dashboards"
+ }
+ ],
+ "panels": [
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 0
+ },
+ "id": 1,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "namedprocess_namegroup_num_procs{groupname=~\"$processes\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{groupname}} - {{hostname}}",
+ "metric": "process_namegroup_num_procs",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "num processes",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 0
+ },
+ "id": 2,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(namedprocess_namegroup_cpu_system_seconds_total{groupname=~\"$processes\", nc_region=\"$nc_region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{groupname}} - {{hostname}}",
+ "metric": "process_namegroup_cpu_seconds_total",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "cpu",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 7
+ },
+ "id": 3,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(namedprocess_namegroup_read_bytes_total{groupname=~\"$processes\", nc_region=\"$nc_region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{groupname}} - {{hostname}}",
+ "metric": "namedprocess_namegroup_read_bytes_total",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "read bytes",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 7
+ },
+ "id": 4,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(namedprocess_namegroup_write_bytes_total{groupname=~\"$processes\", nc_region=\"$nc_region\"}[$interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{groupname}} - {{hostname}}",
+ "metric": "namedprocess_namegroup_read_bytes_total",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "write bytes",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "Bps",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 14
+ },
+ "id": 5,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "namedprocess_namegroup_memory_bytes{groupname=~\"$processes\", memtype=\"resident\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{groupname}} - {{hostname}}",
+ "metric": "namedprocess_namegroup_memory_bytes",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "resident memory",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 14
+ },
+ "id": 6,
+ "isNew": true,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "namedprocess_namegroup_memory_bytes{groupname=~\"$processes\", memtype=\"virtual\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{groupname}} - {{hostname}}",
+ "metric": "namedprocess_namegroup_memory_bytes",
+ "refId": "A",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "virtual memory",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "1m",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [
+ "OS"
+ ],
+ "templating": {
+ "list": [
+ {
+ "auto": false,
+ "auto_count": 30,
+ "auto_min": "10s",
+ "current": {
+ "text": "10m",
+ "value": "10m"
+ },
+ "datasource": null,
+ "hide": 0,
+ "includeAll": false,
+ "label": "",
+ "multi": false,
+ "name": "interval",
+ "options": [
+ {
+ "selected": false,
+ "text": "1m",
+ "value": "1m"
+ },
+ {
+ "selected": false,
+ "text": "5m",
+ "value": "5m"
+ },
+ {
+ "selected": true,
+ "text": "10m",
+ "value": "10m"
+ },
+ {
+ "selected": false,
+ "text": "30m",
+ "value": "30m"
+ },
+ {
+ "selected": false,
+ "text": "1h",
+ "value": "1h"
+ },
+ {
+ "selected": false,
+ "text": "6h",
+ "value": "6h"
+ },
+ {
+ "selected": false,
+ "text": "12h",
+ "value": "12h"
+ },
+ {
+ "selected": false,
+ "text": "1d",
+ "value": "1d"
+ },
+ {
+ "selected": false,
+ "text": "7d",
+ "value": "7d"
+ },
+ {
+ "selected": false,
+ "text": "14d",
+ "value": "14d"
+ },
+ {
+ "selected": false,
+ "text": "30d",
+ "value": "30d"
+ }
+ ],
+ "query": "1m,5m,10m,30m,1h,6h,12h,1d,7d,14d,30d",
+ "refresh": 2,
+ "skipUrlSync": false,
+ "type": "interval"
+ },
+ {
+ "allValue": ".+",
+ "current": {
+ "selected": false,
+ "tags": [],
+ "text": "All",
+ "value": [
+ "$__all"
+ ]
+ },
+ "datasource": "prometheus",
+ "definition": "label_values(groupname)",
+ "hide": 0,
+ "includeAll": true,
+ "label": null,
+ "multi": true,
+ "name": "processes",
+ "options": [],
+ "query": "label_values(groupname)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "prometheus",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC_Region",
+ "multi": false,
+ "name": "nc_region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 1,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Named Processes",
+ "uid": "named-processes",
+ "version": 1
+ }
+ nodes: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": ""
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "Dashboard to get an overview of one server",
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 128,
+ "links": [],
+ "panels": [
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorPrefix": true,
+ "colorValue": true,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 4,
+ "x": 0,
+ "y": 0
+ },
+ "id": 30,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "$node =",
+ "prefixFontSize": "70%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "node_ntp_leap{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,3",
+ "timeFrom": null,
+ "timeShift": null,
+ "title": "Leap Second Status",
+ "type": "singlestat",
+ "valueFontSize": "70%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "OK",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "add leap second at UTC midnight",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "delete leap second at UTC midnight",
+ "value": "2"
+ },
+ {
+ "op": "=",
+ "text": "unsynchronised",
+ "value": "3"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 4,
+ "x": 4,
+ "y": 0
+ },
+ "id": 18,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "$node =",
+ "prefixFontSize": "70%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "sum(node_timex_pps_jitter_total{node=~\"$node\", nc_region=\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Jitter Count",
+ "type": "singlestat",
+ "valueFontSize": "70%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "total"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 4,
+ "x": 8,
+ "y": 0
+ },
+ "id": 31,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "$node =",
+ "prefixFontSize": "70%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "node_ntp_stratum{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Stratum",
+ "type": "singlestat",
+ "valueFontSize": "70%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "percent",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": true,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 8,
+ "w": 6,
+ "x": 12,
+ "y": 0
+ },
+ "id": 5,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "100 * (1 - (node_memory_MemFree_bytes{hostname=\"$node\", nc_region=\"$region\"} + node_memory_Buffers_bytes{hostname=\"$node\", nc_region=\"$region\"} + node_memory_Cached_bytes{hostname=\"$node\", nc_region=\"$region\"}) / (node_memory_MemTotal_bytes{hostname=\"$node\", nc_region=\"$region\"} - (node_memory_HugePages_Total{hostname=\"$node\", nc_region=\"$region\"} * node_memory_Hugepagesize_bytes{hostname=\"$node\", nc_region=\"$region\"})))",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 60,
+ "target": ""
+ }
+ ],
+ "thresholds": "80, 90",
+ "title": "Memory usage of $node excluding the Hugepages",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "percentunit",
+ "gauge": {
+ "maxValue": 1,
+ "minValue": 0,
+ "show": true,
+ "thresholdLabels": true,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 8,
+ "w": 6,
+ "x": 18,
+ "y": 0
+ },
+ "id": 7,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "(sum(node_filesystem_size_bytes{device!~\"tmpfs|shm\",node=\"$node\", nc_region=\"$region\"}) - sum(node_filesystem_free_bytes{device!~\"tmpfs|shm\",node=\"$node\", nc_region=\"$region\"})) / sum(node_filesystem_size_bytes{device!~\"tmpfs|shm\",node=\"$node\", nc_region=\"$region\"})",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "refId": "A",
+ "step": 60,
+ "target": ""
+ }
+ ],
+ "thresholds": "0.75, 0.90",
+ "title": "Disk space usage of $node",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorPrefix": true,
+ "colorValue": true,
+ "colors": [
+ "#d44a3a",
+ "rgba(237, 129, 40, 0.89)",
+ "#299c46"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 4,
+ "x": 0,
+ "y": 4
+ },
+ "id": 20,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "$node =",
+ "prefixFontSize": "70%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "node_timex_sync_status{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "0,1",
+ "title": "Clock_Synchronization",
+ "type": "singlestat",
+ "valueFontSize": "70%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "Not Synchronized",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "OK",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorPostfix": false,
+ "colorPrefix": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 4,
+ "w": 4,
+ "x": 4,
+ "y": 4
+ },
+ "id": 22,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "/ms",
+ "postfixFontSize": "50%",
+ "prefix": "$node =",
+ "prefixFontSize": "70%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": true,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "node_ntp_sanity{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Sanity Check",
+ "type": "singlestat",
+ "valueFontSize": "70%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 8
+ },
+ "id": 16,
+ "panels": [],
+ "title": "NTP Status",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 2,
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 9
+ },
+ "id": 24,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "node_ntp_root_delay_seconds{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Node_ntp_root_delay_seconds",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "alerting": {},
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 9
+ },
+ "id": 9,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "node_load1{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 4,
+ "legendFormat": "load 1m",
+ "refId": "A",
+ "step": 20,
+ "target": ""
+ },
+ {
+ "expr": "node_load5{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 4,
+ "legendFormat": "load 5m",
+ "refId": "B",
+ "step": 20,
+ "target": ""
+ },
+ {
+ "expr": "node_load15{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 4,
+ "legendFormat": "load 15m",
+ "refId": "C",
+ "step": 20,
+ "target": ""
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "System load",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "percentunit",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 2,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 0,
+ "y": 16
+ },
+ "id": 26,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "node_timex_pps_jitter_seconds{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "node_timex_pps_jitter_seconds",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 12,
+ "y": 16
+ },
+ "id": 28,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "node_ntp_offset_seconds{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "node_ntp_offset_seconds",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 24
+ },
+ "id": 14,
+ "panels": [],
+ "title": "Node Status",
+ "type": "row"
+ },
+ {
+ "alerting": {},
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 8,
+ "w": 23,
+ "x": 0,
+ "y": 25
+ },
+ "id": 3,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "100 - (avg by (cpu) (irate(node_cpu_seconds_total{mode=\"idle\", nc_region=~\"$region\", node=\"$node\"}[1h])) * 100)",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 10,
+ "legendFormat": "",
+ "refId": "A",
+ "step": 50
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "CPU usage",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "percent",
+ "label": "cpu usage",
+ "logBase": 1,
+ "max": 100,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "alerting": {},
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 23,
+ "x": 0,
+ "y": 33
+ },
+ "id": 4,
+ "legend": {
+ "alignAsTable": false,
+ "avg": false,
+ "current": false,
+ "hideEmpty": false,
+ "hideZero": false,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "node_memory_SwapFree{instance=\"$server\",job=\"prometheus\"}",
+ "yaxis": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "node_memory_MemTotal_bytes{node=\"$node\", nc_region=\"$region\"} - node_memory_MemFree_bytes{node=\"$node\", nc_region=\"$region\"} - node_memory_Buffers_bytes{node=\"$node\", nc_region=\"$region\"} - node_memory_Cached_bytes{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "hide": false,
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "memory used",
+ "metric": "",
+ "refId": "C",
+ "step": 10
+ },
+ {
+ "expr": "node_memory_Buffers_bytes{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "memory buffers",
+ "metric": "",
+ "refId": "E",
+ "step": 10
+ },
+ {
+ "expr": "node_memory_Cached_bytes{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "memory cached",
+ "metric": "",
+ "refId": "F",
+ "step": 10
+ },
+ {
+ "expr": "node_memory_MemFree_bytes{node=\"$node\", nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "memory free",
+ "metric": "",
+ "refId": "D",
+ "step": 10
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Memory usage",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "alerting": {},
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 23,
+ "x": 0,
+ "y": 40
+ },
+ "id": 6,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "read",
+ "yaxis": 1
+ },
+ {
+ "alias": "{instance=\"$server\"}",
+ "yaxis": 2
+ },
+ {
+ "alias": "io time",
+ "yaxis": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum by (instance) (rate(node_disk_read_bytes_total{node=\"$node\", nc_region=\"$region\"}[1h]))",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 4,
+ "legendFormat": "read",
+ "refId": "A",
+ "step": 20,
+ "target": ""
+ },
+ {
+ "expr": "sum by (instance) (rate(node_disk_written_bytes_total{node=\"$node\", nc_region=\"$region\"}[1h]))",
+ "format": "time_series",
+ "intervalFactor": 4,
+ "legendFormat": "written",
+ "refId": "B",
+ "step": 20
+ },
+ {
+ "expr": "sum by (instance) (rate(node_disk_io_time_seconds_total{node=\"$node\", nc_region=\"$region\"}[1h]))",
+ "format": "time_series",
+ "intervalFactor": 4,
+ "legendFormat": "io time",
+ "refId": "C",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Disk I/O",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "ms",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "alerting": {},
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 9,
+ "w": 23,
+ "x": 0,
+ "y": 47
+ },
+ "id": 8,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "transmitted ",
+ "yaxis": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(node_network_receive_bytes_total{node=\"$node\", nc_region=\"$region\",device!~\"lo\"}[5m])",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 2,
+ "legendFormat": "{{device}}",
+ "refId": "A",
+ "step": 10,
+ "target": ""
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Network received",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "alerting": {},
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 8,
+ "w": 23,
+ "x": 0,
+ "y": 56
+ },
+ "id": 10,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "transmitted ",
+ "yaxis": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(node_network_transmit_bytes_total{node=\"$node\", nc_region=\"$region\", device!~\"lo\"}[5m])",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 2,
+ "legendFormat": "{{device}}",
+ "refId": "B",
+ "step": 10,
+ "target": ""
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Network transmitted",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "$DS_PROMETHEUS",
+ "fill": 1,
+ "gridPos": {
+ "h": 10,
+ "w": 24,
+ "x": 0,
+ "y": 64
+ },
+ "id": 12,
+ "interval": "",
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "dbus_serial{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{node}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": "1w",
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "systemd_dbus_serial",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": false,
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "label_values(node_uname_info{nc_region=\"$region\"}, node)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Node",
+ "multi": false,
+ "name": "node",
+ "options": [],
+ "query": "label_values(node_uname_info{nc_region=\"$region\"}, node)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Nodes Status",
+ "uid": "nodes-status",
+ "version": 7
+ }
+ prometheus: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "Prometheus which you want to monitor",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": ""
+ },
+ {
+ "type": "panel",
+ "id": "text",
+ "name": "Text",
+ "version": ""
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ },
+ {
+ "datasource": "${DS_PROMETHEUS}",
+ "enable": true,
+ "expr": "count(sum(up{instance=\"$instance\",nc_region=~\"$region\"}) by (instance) < 1)",
+ "hide": false,
+ "iconColor": "rgb(250, 44, 18)",
+ "limit": 100,
+ "name": "downage",
+ "showIn": 0,
+ "step": "30s",
+ "tagKeys": "instance",
+ "textFormat": "prometheus down",
+ "titleFormat": "Downage",
+ "type": "alert"
+ },
+ {
+ "datasource": "${DS_PROMETHEUS}",
+ "enable": true,
+ "expr": "sum(changes(prometheus_config_last_reload_success_timestamp_seconds[10m])) by (instance)",
+ "hide": false,
+ "iconColor": "#fceaca",
+ "limit": 100,
+ "name": "Reload",
+ "showIn": 0,
+ "step": "5m",
+ "tagKeys": "instance",
+ "tags": [],
+ "titleFormat": "Reload",
+ "type": "tags"
+ }
+ ]
+ },
+ "description": "Dashboard for monitoring of Prometheus v2.x.x",
+ "editable": false,
+ "overwrite": true,
+ "gnetId": 3681,
+ "graphTooltip": 1,
+ "id": 224,
+ "links": [
+ {
+ "icon": "info",
+ "tags": [],
+ "targetBlank": true,
+ "title": "Dashboard's Github ",
+ "tooltip": "Github repo of this dashboard",
+ "type": "link",
+ "url": "https://github.com/FUSAKLA/Prometheus2-grafana-dashboard"
+ },
+ {
+ "icon": "doc",
+ "tags": [],
+ "targetBlank": true,
+ "title": "Prometheus Docs",
+ "tooltip": "",
+ "type": "link",
+ "url": "http://prometheus.io/docs/introduction/overview/"
+ }
+ ],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 53,
+ "panels": [],
+ "repeat": null,
+ "title": "Header instance info",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#bf1b00"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 1,
+ "format": "s",
+ "gauge": {
+ "maxValue": 1000000,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 4,
+ "x": 0,
+ "y": 1
+ },
+ "id": 41,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "time() - process_start_time_seconds{instance=\"$instance\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "instant": false,
+ "intervalFactor": 2,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Uptime",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#bf1b00"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "short",
+ "gauge": {
+ "maxValue": 1000000,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 8,
+ "x": 4,
+ "y": 1
+ },
+ "id": 42,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "prometheus_tsdb_head_series{instance=\"$instance\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "instant": false,
+ "intervalFactor": 2,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "500000,800000,1000000",
+ "title": "Total count of time series",
+ "type": "singlestat",
+ "valueFontSize": "150%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 4,
+ "x": 12,
+ "y": 1
+ },
+ "id": 48,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "version",
+ "targets": [
+ {
+ "expr": "prometheus_build_info{instance=\"$instance\",nc_region=~\"$region\"}",
+ "format": "table",
+ "instant": true,
+ "intervalFactor": 2,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Version",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "format": "ms",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 4,
+ "x": 16,
+ "y": 1
+ },
+ "id": 49,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "prometheus_tsdb_head_max_time{instance=\"$instance\",nc_region=~\"$region\"} - prometheus_tsdb_head_min_time{instance=\"$instance\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "instant": true,
+ "intervalFactor": 2,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "",
+ "title": "Actual head block length",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "content": "",
+ "gridPos": {
+ "h": 5,
+ "w": 2,
+ "x": 20,
+ "y": 1
+ },
+ "height": "",
+ "id": 50,
+ "links": [],
+ "mode": "html",
+ "options": {},
+ "title": "",
+ "transparent": true,
+ "type": "text"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": true,
+ "colors": [
+ "#e6522c",
+ "rgba(237, 129, 40, 0.89)",
+ "#299c46"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 2,
+ "x": 22,
+ "y": 1
+ },
+ "id": 52,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "2.12",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "10,20",
+ "title": "",
+ "transparent": true,
+ "type": "singlestat",
+ "valueFontSize": "200%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "avg"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 6
+ },
+ "id": 54,
+ "panels": [],
+ "repeat": null,
+ "title": "Main info",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 0,
+ "y": 7
+ },
+ "id": 15,
+ "legend": {
+ "avg": true,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "max(prometheus_engine_query_duration_seconds{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, slice)",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "max duration for {{slice}}",
+ "metric": "prometheus_local_storage_rushed_mode",
+ "refId": "A",
+ "step": 900
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Query elapsed time",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": "",
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 8,
+ "y": 7
+ },
+ "id": 17,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(prometheus_tsdb_head_series_created_total{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "created on {{ instance }}",
+ "metric": "prometheus_local_storage_maintain_series_duration_seconds_count",
+ "refId": "A",
+ "step": 1800
+ },
+ {
+ "expr": "sum(prometheus_tsdb_head_series_removed_total{instance=\"$instance\",nc_region=~\"$region\"}) by (instance) * -1",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "removed on {{ instance }}",
+ "refId": "B"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Head series created/deleted",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 16,
+ "y": 7
+ },
+ "id": 13,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum_over_time(prometheus_target_scrapes_exceeded_sample_limit_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "exceeded_sample_limit on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "A",
+ "step": 1800
+ },
+ {
+ "expr": "sum_over_time(prometheus_target_scrapes_sample_duplicate_timestamp_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "duplicate_timestamp on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "B",
+ "step": 1800
+ },
+ {
+ "expr": "sum_over_time(prometheus_target_scrapes_sample_out_of_bounds_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "out_of_bounds on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "C",
+ "step": 1800
+ },
+ {
+ "expr": "sum_over_time(prometheus_target_scrapes_sample_out_of_order_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "out_of_order on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "D",
+ "step": 1800
+ },
+ {
+ "expr": "sum_over_time(prometheus_rule_evaluation_failures_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "rule_evaluation_failure on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "G",
+ "step": 1800
+ },
+ {
+ "expr": "sum_over_time(prometheus_tsdb_compactions_failed_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "tsdb_compactions_failed on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "K",
+ "step": 1800
+ },
+ {
+ "expr": "sum_over_time(prometheus_tsdb_reloads_failures_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "tsdb_reloads_failures on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "L",
+ "step": 1800
+ },
+ {
+ "expr": "sum_over_time(prometheus_tsdb_head_series_not_found{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "head_series_not_found on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "E",
+ "step": 1800
+ },
+ {
+ "expr": "sum_over_time(prometheus_evaluator_iterations_missed_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "evaluator_iterations_missed on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "O",
+ "step": 1800
+ },
+ {
+ "expr": "sum_over_time(prometheus_evaluator_iterations_skipped_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "evaluator_iterations_skipped on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "P",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Prometheus errors",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 14
+ },
+ "id": 55,
+ "panels": [],
+ "repeat": null,
+ "title": "Scrape & rule duration",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "description": "",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 15
+ },
+ "id": 25,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": false,
+ "show": false,
+ "sort": "max",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "prometheus_target_interval_length_seconds{instance=\"$instance\",quantile=\"0.99\",nc_region=~\"$region\"} - 60",
+ "format": "time_series",
+ "interval": "2m",
+ "intervalFactor": 1,
+ "legendFormat": "{{instance}}",
+ "metric": "",
+ "refId": "A",
+ "step": 300
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Scrape delay (counts with 1m scrape interval)",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 15
+ },
+ "id": 14,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "Queue length",
+ "yaxis": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(prometheus_rule_evaluation_duration_seconds{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, quantile)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Queue length",
+ "metric": "prometheus_local_storage_indexing_queue_length",
+ "refId": "B",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Rule evaluation duration",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 22
+ },
+ "id": 56,
+ "panels": [],
+ "repeat": null,
+ "title": "Requests & queries",
+ "type": "row"
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 0,
+ "y": 23
+ },
+ "id": 18,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum_over_time(prometheus_http_requests_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ handler }} on {{ instance }}",
+ "metric": "",
+ "refId": "A",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Request count",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 6,
+ "y": 23
+ },
+ "id": 16,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "hideEmpty": true,
+ "hideZero": true,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "max(sum(prometheus_http_request_duration_seconds_sum{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, handler, quantile)) by (instance, handler) > 0",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 2,
+ "legendFormat": "{{ handler }} on {{ instance }}",
+ "refId": "B"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Request duration per handler",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "µs",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 12,
+ "y": 23
+ },
+ "id": 19,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum_over_time(prometheus_http_response_size_bytes_sum{instance=\"$instance\", nc_region=~\"$region\"}[$aggregation_interval]) > 0",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 2,
+ "legendFormat": "{{ handler }} in {{ instance }}",
+ "refId": "B"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Response size by handler",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Allocated bytes": "#F9BA8F",
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max count collector": "#bf1b00",
+ "Max count harvester": "#bf1b00",
+ "Max to persist": "#3F6833",
+ "RSS": "#890F02"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 18,
+ "y": 23
+ },
+ "id": 8,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "/Max.*/",
+ "fill": 0,
+ "linewidth": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(prometheus_engine_queries{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, handler)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Current count ",
+ "metric": "last",
+ "refId": "A",
+ "step": 1800
+ },
+ {
+ "expr": "sum(prometheus_engine_queries_concurrent_max{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, handler)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Max count",
+ "metric": "last",
+ "refId": "B",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Count of concurrent queries",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 30
+ },
+ "id": 57,
+ "panels": [],
+ "repeat": null,
+ "title": "Alerting",
+ "type": "row"
+ },
+ {
+ "aliasColors": {
+ "Alert queue capacity on o collector": "#bf1b00",
+ "Alert queue capacity on o harvester": "#bf1b00",
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 0,
+ "y": 31
+ },
+ "id": 20,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "/.*capacity.*/",
+ "fill": 0,
+ "linewidth": 2
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(prometheus_notifications_queue_capacity{instance=\"$instance\",nc_region=~\"$region\"})by (instance)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Alert queue capacity ",
+ "metric": "prometheus_local_storage_checkpoint_last_size_bytes",
+ "refId": "A",
+ "step": 1800
+ },
+ {
+ "expr": "sum(prometheus_notifications_queue_length{instance=\"$instance\",nc_region=~\"$region\"})by (instance)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Alert queue size on ",
+ "metric": "prometheus_local_storage_checkpoint_last_size_bytes",
+ "refId": "B",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Alert queue size",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 8,
+ "y": 31
+ },
+ "id": 21,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(prometheus_notifications_alertmanagers_discovered{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Discovered alertmanagers",
+ "metric": "prometheus_local_storage_checkpoint_series_chunks_written_sum",
+ "refId": "A",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Count of discovered alertmanagers",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 16,
+ "y": 31
+ },
+ "id": 39,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum_over_time(prometheus_notifications_dropped_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "notifications_dropped on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "F",
+ "step": 1800
+ },
+ {
+ "expr": "sum_over_time(prometheus_rule_evaluation_failures_total{rule_type=\"alerting\",instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "rule_evaluation_failures on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "A",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Alerting errors",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 38
+ },
+ "id": 58,
+ "panels": [],
+ "repeat": null,
+ "title": "Service discovery",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 0,
+ "y": 39
+ },
+ "id": 45,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "count_over_time(prometheus_target_sync_length_seconds_count{scrape_job=\"kubernetes-service-endpoints\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Count of target syncs",
+ "refId": "A",
+ "step": 240
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Kubernetes SD sync count",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 6,
+ "y": 39
+ },
+ "id": 46,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "prometheus_target_scrapes_exceeded_sample_limit_total{instance=\"$instance\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "exceeded_sample_limit on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "A",
+ "step": 1800
+ },
+ {
+ "expr": "prometheus_sd_file_read_errors_total{instance=\"$instance\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "sd_file_read_error on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "E",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Service discovery errors",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 46
+ },
+ "id": 59,
+ "panels": [],
+ "repeat": null,
+ "title": "TSDB stats",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 0,
+ "y": 47
+ },
+ "id": 36,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(increase(prometheus_tsdb_reloads_total{instance=\"$instance\",nc_region=~\"$region\"}[30m])) by (instance)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ instance }}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Reloaded block from disk",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 6,
+ "y": 47
+ },
+ "id": 5,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(prometheus_tsdb_blocks_loaded{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Loaded data blocks",
+ "metric": "prometheus_local_storage_memory_chunkdescs",
+ "refId": "A",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Loaded data blocks",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 12,
+ "y": 47
+ },
+ "id": 3,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "prometheus_tsdb_head_series{instance=\"$instance\",nc_region=~\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Time series count",
+ "metric": "prometheus_local_storage_memory_series",
+ "refId": "A",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Time series total count",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 18,
+ "y": 47
+ },
+ "id": 1,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum_over_time(prometheus_tsdb_head_samples_appended_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "samples/s {{instance}}",
+ "metric": "prometheus_local_storage_ingested_samples_total",
+ "refId": "A",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Samples Appended per second",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "",
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 54
+ },
+ "id": 60,
+ "panels": [],
+ "repeat": null,
+ "title": "Head block stats",
+ "type": "row"
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833",
+ "To persist": "#9AC48A"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 0,
+ "y": 55
+ },
+ "id": 2,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "/Max.*/",
+ "fill": 0
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(prometheus_tsdb_head_chunks{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 2,
+ "legendFormat": "Head chunk count",
+ "metric": "prometheus_local_storage_memory_chunks",
+ "refId": "A",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Head chunks count",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 8,
+ "y": 55
+ },
+ "id": 35,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "max(prometheus_tsdb_head_max_time{instance=\"$instance\",nc_region=~\"$region\"}) by (instance) - min(prometheus_tsdb_head_min_time{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ instance }}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Length of head block",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "ms",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 16,
+ "y": 55
+ },
+ "id": 4,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(prometheus_tsdb_head_chunks_created_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])) by (instance)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "created on {{ instance }}",
+ "refId": "B"
+ },
+ {
+ "expr": "sum(rate(prometheus_tsdb_head_chunks_removed_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])) by (instance) * -1",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "deleted on {{ instance }}",
+ "refId": "C"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Head Chunks Created/Deleted per second",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 62
+ },
+ "id": 61,
+ "panels": [],
+ "repeat": null,
+ "title": "Data maintenance",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 0,
+ "y": 63
+ },
+ "id": 33,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum_over_time(prometheus_tsdb_compaction_duration_seconds_sum{instance=\"$instance\",nc_region=~\"$region\"}[30m]) / sum_over_time(prometheus_tsdb_compaction_duration_seconds_count{instance=\"$instance\",nc_region=~\"$region\"}[30m])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ instance }}",
+ "refId": "B"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Compaction duration",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 6,
+ "y": 63
+ },
+ "id": 34,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(prometheus_tsdb_head_gc_duration_seconds_sum{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, quantile)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ quantile }} on {{ instance }}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Head block garbage collection duration",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 12,
+ "y": 63
+ },
+ "id": 37,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(prometheus_tsdb_wal_truncate_duration_seconds_sum{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, quantile)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ quantile }} on {{ instance }}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "WAL truncate duration seconds",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 18,
+ "y": 63
+ },
+ "id": 38,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(prometheus_tsdb_wal_fsync_duration_seconds{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, quantile)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{ quantile }} {{ instance }}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "WAL fsync duration seconds",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "s",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 70
+ },
+ "id": 62,
+ "panels": [],
+ "repeat": null,
+ "title": "RAM&CPU",
+ "type": "row"
+ },
+ {
+ "aliasColors": {
+ "Allocated bytes": "#7EB26D",
+ "Allocated bytes - 1m max": "#BF1B00",
+ "Allocated bytes - 1m min": "#BF1B00",
+ "Allocated bytes - 5m max": "#BF1B00",
+ "Allocated bytes - 5m min": "#BF1B00",
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833",
+ "RSS": "#447EBC"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": null,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 0,
+ "y": 71
+ },
+ "id": 6,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "alias": "/-/",
+ "fill": 0
+ },
+ {
+ "alias": "collector heap size",
+ "color": "#E0752D",
+ "fill": 0,
+ "linewidth": 2
+ },
+ {
+ "alias": "collector kubernetes memory limit",
+ "color": "#BF1B00",
+ "fill": 0,
+ "linewidth": 3
+ }
+ ],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(process_resident_memory_bytes{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 2,
+ "legendFormat": "Total resident memory - {{instance}}",
+ "metric": "process_resident_memory_bytes",
+ "refId": "B",
+ "step": 1800
+ },
+ {
+ "expr": "sum(go_memstats_alloc_bytes{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 2,
+ "legendFormat": "Total allocated bytes - {{instance}}",
+ "metric": "go_memstats_alloc_bytes",
+ "refId": "A",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Memory",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {
+ "Allocated bytes": "#F9BA8F",
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833",
+ "RSS": "#890F02"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 8,
+ "y": 71
+ },
+ "id": 7,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(go_memstats_alloc_bytes_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "Allocated Bytes/s",
+ "metric": "go_memstats_alloc_bytes",
+ "refId": "A",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Allocations per second",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 2,
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 16,
+ "y": 71
+ },
+ "id": 9,
+ "legend": {
+ "alignAsTable": false,
+ "avg": false,
+ "current": false,
+ "hideEmpty": false,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(rate(process_cpu_seconds_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])) by (instance)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "CPU/s",
+ "metric": "prometheus_local_storage_ingested_samples_total",
+ "refId": "B",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "CPU per second",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": [
+ "avg"
+ ]
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 78
+ },
+ "id": 63,
+ "panels": [],
+ "repeat": null,
+ "title": "Conntrack errors",
+ "type": "row"
+ },
+ {
+ "aliasColors": {
+ "Chunks": "#1F78C1",
+ "Chunks to persist": "#508642",
+ "Max chunks": "#052B51",
+ "Max to persist": "#3F6833"
+ },
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 24,
+ "x": 0,
+ "y": 79
+ },
+ "id": 47,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": false,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum(increase(net_conntrack_dialer_conn_failed_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])) by (instance)",
+ "format": "time_series",
+ "hide": false,
+ "interval": "",
+ "intervalFactor": 2,
+ "legendFormat": "conntrack_dialer_conn_failed on {{ instance }}",
+ "metric": "prometheus_local_storage_chunk_ops_total",
+ "refId": "M",
+ "step": 1800
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Net errors",
+ "tooltip": {
+ "msResolution": false,
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "5m",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [
+ "prometheus"
+ ],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": ".+",
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(prometheus_build_info{nc_region=~\"$region\"}, instance)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Instance",
+ "multi": false,
+ "name": "instance",
+ "options": [],
+ "query": "label_values(prometheus_build_info{nc_region=~\"$region\"}, instance)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 2,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "auto": true,
+ "auto_count": 30,
+ "auto_min": "2m",
+ "current": {
+ "text": "30m",
+ "value": "30m"
+ },
+ "hide": 0,
+ "label": "aggregation interval",
+ "name": "aggregation_interval",
+ "options": [
+ {
+ "selected": false,
+ "text": "auto",
+ "value": "$__auto_interval_aggregation_interval"
+ },
+ {
+ "selected": false,
+ "text": "1m",
+ "value": "1m"
+ },
+ {
+ "selected": false,
+ "text": "10m",
+ "value": "10m"
+ },
+ {
+ "selected": true,
+ "text": "30m",
+ "value": "30m"
+ },
+ {
+ "selected": false,
+ "text": "1h",
+ "value": "1h"
+ },
+ {
+ "selected": false,
+ "text": "6h",
+ "value": "6h"
+ },
+ {
+ "selected": false,
+ "text": "12h",
+ "value": "12h"
+ },
+ {
+ "selected": false,
+ "text": "1d",
+ "value": "1d"
+ },
+ {
+ "selected": false,
+ "text": "7d",
+ "value": "7d"
+ },
+ {
+ "selected": false,
+ "text": "14d",
+ "value": "14d"
+ },
+ {
+ "selected": false,
+ "text": "30d",
+ "value": "30d"
+ }
+ ],
+ "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d",
+ "refresh": 2,
+ "skipUrlSync": false,
+ "type": "interval"
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Prometheus2.12.0",
+ "uid": "prometheus",
+ "version": 7
+ }
+ calico: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "Calico cluster monitoring dashboard",
+ "editable": false,
+ "overwrite": true,
+ "gnetId": 3244,
+ "graphTooltip": 0,
+ "id": 137,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "true": 0,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 15,
+ "panels": [],
+ "repeat": null,
+ "title": "Felix",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 1,
+ "w": 12,
+ "x": 0,
+ "y": 1
+ },
+ "id": 1,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_active_local_endpoints{nc_region=~\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Active Local Endpoints",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 1,
+ "w": 12,
+ "x": 12,
+ "y": 1
+ },
+ "id": 3,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_active_local_policies{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Active Local Policies",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 8,
+ "w": 12,
+ "x": 0,
+ "y": 8
+ },
+ "id": 2,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_active_local_selectors{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Active Local Selectors",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 8,
+ "w": 12,
+ "x": 12,
+ "y": 8
+ },
+ "id": 4,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_active_local_tags{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Active Local Tags",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 15,
+ "w": 12,
+ "x": 0,
+ "y": 15
+ },
+ "id": 5,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_cluster_num_host_endpoints{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Cluster Host Endpoints",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 15,
+ "w": 12,
+ "x": 12,
+ "y": 15
+ },
+ "id": 6,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_cluster_num_workload_endpoints{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Cluster Workload Endpoints",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 22,
+ "w": 12,
+ "x": 0,
+ "y": 22
+ },
+ "id": 7,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_cluster_num_hosts{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Cluster Hosts",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 22,
+ "w": 12,
+ "x": 12,
+ "y": 22
+ },
+ "id": 8,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_ipsets_calico{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Active IP Sets",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 29,
+ "w": 12,
+ "x": 0,
+ "y": 29
+ },
+ "id": 9,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_iptables_chains{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Active IP Tables Chains",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 29,
+ "w": 12,
+ "x": 12,
+ "y": 29
+ },
+ "id": 10,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_ipset_errors{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "IP Set Command Failures",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 36,
+ "w": 12,
+ "x": 0,
+ "y": 36
+ },
+ "id": 11,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_iptables_save_errors{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "IP Tables Save Errors",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 36,
+ "w": 12,
+ "x": 12,
+ "y": 36
+ },
+ "id": 12,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_iptables_restore_errors{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "IP Tables Restore Errors",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 43,
+ "w": 12,
+ "x": 0,
+ "y": 43
+ },
+ "id": 13,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_resyncs_started{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Felix Resyncing Datastore",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 43,
+ "w": 12,
+ "x": 12,
+ "y": 43
+ },
+ "id": 14,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_int_dataplane_failures{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Dataplane failed updates",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 43,
+ "w": 12,
+ "x": 0,
+ "y": 50
+ },
+ "id": 16,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_int_dataplane_addr_msg_batch_size{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Felix int dataplane addr msg batch size",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 43,
+ "w": 12,
+ "x": 12,
+ "y": 50
+ },
+ "id": 17,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": true,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "felix_int_dataplane_iface_msg_batch_size{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Felix int dataplane iface msg batch size",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "true": 43,
+ "w": 12,
+ "x": 0,
+ "y": 57
+ },
+ "id": 18,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "go_memstats_frees_total{nc_region=\"$region\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{nc_region}} - {{instance}}",
+ "refId": "A",
+ "step": 20
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "go memstats frees total",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "bytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "5m",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [
+ "calico"
+ ],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Kubernetes Calico",
+ "uid": "kubernetes-calico",
+ "version": 1
+ }
+ openvswitch: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "6.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": "5.0.0"
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": "5.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 82,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 6,
+ "panels": [],
+ "title": "SRIOV",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 10,
+ "x": 0,
+ "y": 1
+ },
+ "id": 12,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(sriov_rx_bytes{node_name=~\"$node\", nc_region=~\"$region\"}[5m])",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{interface}} vfid:{{vfid}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "sriov_rx_bytes",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 10,
+ "x": 10,
+ "y": 1
+ },
+ "id": 13,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 2,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(sriov_tx_bytes{node_name=~\"$node\", nc_region=~\"$region\"}[5m])",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{interface}} vfid:{{vfid}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "sriov_tx_bytes",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 10,
+ "x": 0,
+ "y": 8
+ },
+ "id": 11,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(sriov_rx_dropped{node_name=~\"$node\", nc_region=~\"$region\"}[5m])",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{interface}} vfid:{{vfid}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "sriov_rx_dropped",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 10,
+ "x": 10,
+ "y": 8
+ },
+ "id": 21,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(sriov_tx_dropped{node_name=~\"$node\", nc_region=~\"$region\"}[5m])",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{interface}} vfid:{{vfid}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "sriov_tx_dropped",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 10,
+ "x": 0,
+ "y": 15
+ },
+ "id": 7,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(sriov_tx_errors{node_name=~\"$node\", nc_region=~\"$region\"}[5m])",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{interface}} vfid:{{vfid}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "sriov_tx_errors",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 22
+ },
+ "id": 9,
+ "panels": [],
+ "title": "Openvswitch",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 10,
+ "x": 0,
+ "y": 23
+ },
+ "id": 15,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(ovs_rx_bytes{node_name=~\"$node\", nc_region=~\"$region\"}[5m])",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{interface}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "ovs_rx_bytes",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 10,
+ "x": 10,
+ "y": 23
+ },
+ "id": 14,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(ovs_tx_bytes{node_name=~\"$node\", nc_region=~\"$region\"}[5m])",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{interface}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "ovs_tx_bytes",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 10,
+ "x": 0,
+ "y": 30
+ },
+ "id": 10,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(ovs_rx_errors{node_name=~\"$node\", nc_region=~\"$region\"}[5m])",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{interface}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "ovs_rx_errors",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 10,
+ "x": 10,
+ "y": 30
+ },
+ "id": 20,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rate(ovs_tx_errors{node_name=~\"$node\", nc_region=~\"$region\"}[5m])",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{interface}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "ovs_tx_errors",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus Source",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(node_uname_info{nc_region=\"$region\"}, hostname)",
+ "hide": 0,
+ "includeAll": true,
+ "label": "Node",
+ "multi": false,
+ "name": "node",
+ "options": [],
+ "query": "label_values(node_uname_info{nc_region=\"$region\"}, hostname)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Openvswitch Stats",
+ "uid": "openvswitch-stats",
+ "version": 1
+ }
+ openstack-metrics: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": "5.0.0"
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": "5.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 149,
+ "links": [],
+ "panels": [
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#d44a3a",
+ "#299c46",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 3,
+ "x": 0,
+ "y": 0
+ },
+ "id": 12,
+ "interval": "> 60s",
+ "links": [
+ {
+ "dashUri": "db/openstack_services_nova",
+ "dashboard": "Openstack_Services_Nova",
+ "includeVars": true,
+ "keepTime": false,
+ "name": "Drilldown dashboard",
+ "params": "var-Service=nova",
+ "title": "Openstack_Services_Nova",
+ "type": "dashboard"
+ }
+ ],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_nova_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "1,2",
+ "title": "Nova_API_Check",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "no data",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "API CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "API OK",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "UNKW",
+ "value": "2"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#d44a3a",
+ "#299c46",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 3,
+ "x": 3,
+ "y": 0
+ },
+ "id": 13,
+ "interval": "> 60s",
+ "links": [
+ {
+ "dashUri": "db/openstack_services_neutron",
+ "dashboard": "Openstack_Services_Neutron",
+ "includeVars": true,
+ "name": "Drilldown dashboard",
+ "params": "var-Service=neutron",
+ "title": "Openstack_Services_Neutron",
+ "type": "dashboard"
+ }
+ ],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_neutron_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "1,2",
+ "title": "Neutron_API_Check",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "no data",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "API CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "API OK",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "UNKW",
+ "value": "2"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#d44a3a",
+ "#299c46",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 3,
+ "x": 6,
+ "y": 0
+ },
+ "id": 14,
+ "interval": "> 60s",
+ "links": [
+ {
+ "dashUri": "db/openstack_services_cinder",
+ "dashboard": "Openstack_Services_Cinder",
+ "includeVars": true,
+ "name": "Drilldown dashboard",
+ "params": "var-Service=cinder",
+ "title": "Openstack_Services_Cinder",
+ "type": "dashboard"
+ }
+ ],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_cinder_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "1,2",
+ "title": "Cinder_API_Check",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "no data",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "API CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "API OK",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "UNKW",
+ "value": "2"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#d44a3a",
+ "#299c46",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 3,
+ "x": 9,
+ "y": 0
+ },
+ "id": 10,
+ "interval": "> 60s",
+ "links": [
+ {
+ "dashUri": "db/openstack_services_glance",
+ "dashboard": "Openstack_Services_Glance",
+ "includeVars": true,
+ "name": "Drilldown dashboard",
+ "params": "var-Service=glance",
+ "title": "Openstack_Services_Glance",
+ "type": "dashboard"
+ }
+ ],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_glance_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "1,2",
+ "title": "Glance_API_Check",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "no data",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "API CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "API OK",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "UNKW",
+ "value": "2"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#d44a3a",
+ "#cca300",
+ "#299c46"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 3,
+ "x": 12,
+ "y": 0
+ },
+ "id": 15,
+ "interval": "> 60s",
+ "links": [
+ {
+ "dashUri": "db/openstack_services_heat",
+ "dashboard": "Openstack_Services_Heat",
+ "includeVars": true,
+ "name": "Drilldown dashboard",
+ "params": "",
+ "title": "Openstack_Services_Heat",
+ "type": "dashboard"
+ }
+ ],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(openstack_check_heat_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_check_heat_cfn_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "2,2",
+ "title": "Heat_API_Check (Heat and Heat_CFN)",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "no data",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "API CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "API OK",
+ "value": "2"
+ },
+ {
+ "op": "=",
+ "text": "API CRITICAL",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "unknown",
+ "value": "3"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#d44a3a",
+ "#299c46",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 3,
+ "x": 15,
+ "y": 0
+ },
+ "id": 16,
+ "interval": "> 60s",
+ "links": [
+ {
+ "dashUri": "db/openstack_services_keystone",
+ "dashboard": "Openstack_Services_Keystone",
+ "includeVars": true,
+ "params": "",
+ "targetBlank": false,
+ "title": "Openstack_Services_Keystone",
+ "type": "dashboard"
+ }
+ ],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_keystone_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "1,2",
+ "title": "Keystone_API_Check",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "no data",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "API CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "API OK",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "UNKW",
+ "value": "2"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#d44a3a",
+ "#299c46",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 3,
+ "x": 18,
+ "y": 0
+ },
+ "id": 17,
+ "interval": "> 60s",
+ "links": [
+ {
+ "dashUri": "db/openstack_services_swift",
+ "dashboard": "Openstack_Services_Swift",
+ "includeVars": true,
+ "title": "Openstack_Services_Swift",
+ "type": "dashboard"
+ }
+ ],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_swift_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "1,2",
+ "title": "Swift_API_Check",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "no data",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "API CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "API OK",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "UNKW",
+ "value": "2"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#d44a3a",
+ "#299c46",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 3,
+ "x": 21,
+ "y": 0
+ },
+ "id": 18,
+ "interval": "> 60s",
+ "links": [
+ {
+ "dashUri": "db/openstack_services_placement",
+ "dashboard": "Openstack_Services_Placement",
+ "includeVars": true,
+ "title": "Openstack_Services_Placement",
+ "type": "dashboard"
+ }
+ ],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_placement_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "1,2",
+ "title": "Placement_API_Check",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "no data",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "API CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "API OK",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "UNKW",
+ "value": "2"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 3,
+ "x": 0,
+ "y": 5
+ },
+ "id": 2,
+ "interval": "> 60s",
+ "links": [
+ {
+ "dashUri": "db/openstack_services_nova",
+ "dashboard": "Openstack_Services_Nova",
+ "includeVars": true,
+ "name": "Drilldown dashboard",
+ "params": "",
+ "title": "Openstack_Services_Nova",
+ "type": "dashboard"
+ }
+ ],
+ "mappingType": 2,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "0",
+ "text": "Services OK",
+ "to": "0"
+ },
+ {
+ "from": "1",
+ "text": "Services CRITICAL",
+ "to": "100"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(openstack_services_nova_compute_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_nova_compute_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_nova_conductor_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_nova_conductor_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_nova_scheduler_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_nova_scheduler_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "instant": false,
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Nova",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "no data",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "HEALTHY",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "UNHEALTHY",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 3,
+ "x": 3,
+ "y": 5
+ },
+ "id": 3,
+ "interval": "> 60s",
+ "links": [
+ {
+ "dashUri": "db/openstack_services_neutron",
+ "dashboard": "Openstack_Services_Neutron",
+ "includeVars": true,
+ "name": "Drilldown dashboard",
+ "params": "",
+ "title": "Openstack_Services_Neutron",
+ "type": "dashboard"
+ }
+ ],
+ "mappingType": 2,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "0",
+ "text": "Services OK",
+ "to": "0"
+ },
+ {
+ "from": "1",
+ "text": "Services CRITICAL",
+ "to": "100"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(openstack_services_neutron_l3_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_l3_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_dhcp_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_dhcp_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_metadata_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_metadata_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_openvswitch_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_openvswitch_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_sriov_nic_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_sriov_nic_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Neutron",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "no data",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "HEALTHY",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "UNHEALTHY",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 5,
+ "w": 3,
+ "x": 6,
+ "y": 5
+ },
+ "id": 11,
+ "interval": "> 60s",
+ "links": [
+ {
+ "dashUri": "db/openstack_services_cinder",
+ "dashboard": "Openstack_Services_Cinder",
+ "includeVars": true,
+ "name": "Drilldown dashboard",
+ "params": "",
+ "title": "Openstack_Services_Cinder",
+ "type": "dashboard"
+ }
+ ],
+ "mappingType": 2,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "0",
+ "text": "Services OK",
+ "to": "0"
+ },
+ {
+ "from": "1",
+ "text": "Services CRITICAL",
+ "to": "100"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(openstack_services_cinder_volume_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_cinder_volume_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_cinder_backup_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_cinder_backup_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_cinder_scheduler_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_cinder_scheduler_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Cinder",
+ "type": "singlestat",
+ "valueFontSize": "50%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "no data",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "HEALTHY",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "UNHEALTHY",
+ "value": "1"
+ },
+ {
+ "op": "=",
+ "text": "UNKW",
+ "value": "2"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 10
+ },
+ "id": 5,
+ "panels": [],
+ "title": "Resource Utilization",
+ "type": "row"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 0,
+ "gridPos": {
+ "h": 9,
+ "w": 8,
+ "x": 0,
+ "y": 11
+ },
+ "id": 7,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": true,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "openstack_total_used_ram_MB{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "legendFormat": "Used",
+ "refId": "A"
+ },
+ {
+ "expr": "openstack_total_free_ram_MB{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "Free",
+ "refId": "B"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "os_vm_ram_usage",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decmbytes",
+ "label": "Memory Usage",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 0,
+ "gridPos": {
+ "h": 9,
+ "w": 8,
+ "x": 8,
+ "y": 11
+ },
+ "id": 8,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": true,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "openstack_total_used_vcpus{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "legendFormat": "Used",
+ "refId": "A"
+ },
+ {
+ "expr": "openstack_total_free_vcpus{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "Free",
+ "refId": "B"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "os_vm_vcpu_usage",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": "VCPU Usage",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 0,
+ "gridPos": {
+ "h": 9,
+ "w": 8,
+ "x": 16,
+ "y": 11
+ },
+ "id": 9,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "openstack_total_used_disk_GB{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "interval": "",
+ "intervalFactor": 1,
+ "legendFormat": "Used",
+ "refId": "A"
+ },
+ {
+ "expr": "openstack_total_free_disk_GB{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "Free",
+ "refId": "B"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "os_vm_disk_usage",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decgbytes",
+ "label": "disk Usage",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "nc_region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Openstack Region",
+ "multi": false,
+ "name": "openstack_region",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": false,
+ "label": "namespace",
+ "multi": false,
+ "name": "namespace",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Openstack_Metrics_Overall",
+ "uid": "openstack-metrics-overall",
+ "version": 3
+ }
+ openstack-nova: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": "5.0.0"
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": "5.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 76,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 42,
+ "panels": [],
+ "title": "Nova API",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(225, 177, 40, 0.59)",
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 0,
+ "y": 1
+ },
+ "id": 40,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_nova_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "0,1",
+ "title": "Nova_API_Service",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "OK",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 4,
+ "y": 1
+ },
+ "id": 43,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(nginx_responses_total{server_zone=~\"nova.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "count",
+ "groupBy": [
+ {
+ "interval": "auto",
+ "params": [
+ "auto"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": "",
+ "title": "HTTP 5xx errors",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "0",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 13,
+ "x": 8,
+ "y": 1
+ },
+ "id": 44,
+ "interval": "> 60s",
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "alias": "healthy",
+ "column": "value",
+ "expr": "openstack_check_nova_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "select": [],
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "API Availability",
+ "tooltip": {
+ "msResolution": false,
+ "shared": false,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "",
+ "logBase": 1,
+ "max": 1,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 8
+ },
+ "id": 7,
+ "panels": [],
+ "repeat": "openstack_region",
+ "title": "Nova",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 0,
+ "y": 9
+ },
+ "id": 9,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "maxPerRow": 1,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "repeat": "type",
+ "repeatDirection": "v",
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_nova_compute_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 4,
+ "legendFormat": "",
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Nova-compute-down",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 2,
+ "y": 9
+ },
+ "id": 11,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_nova_compute_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Nova-compute-disabled",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 4,
+ "y": 9
+ },
+ "id": 20,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_nova_conductor_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Nova-conductor-disabled",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 6,
+ "y": 9
+ },
+ "id": 23,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_nova_conductor_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Nova-conductor-down",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 8,
+ "y": 9
+ },
+ "id": 19,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_nova_scheduler_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Nova-scheduler-down",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 10,
+ "y": 9
+ },
+ "id": 24,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_nova_scheduler_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Nova-scheduler-disabled",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 0,
+ "gridPos": {
+ "h": 9,
+ "w": 24,
+ "x": 0,
+ "y": 16
+ },
+ "hideTimeOverride": false,
+ "id": 15,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 1,
+ "points": false,
+ "renderer": "flot",
+ "repeat": null,
+ "repeatDirection": "h",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "openstack_services_nova_nova_consoleauth{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A"
+ },
+ {
+ "expr": "openstack_services_nova_nova_compute{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "B"
+ },
+ {
+ "expr": "openstack_services_nova_nova_conductor{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "C"
+ },
+ {
+ "expr": "openstack_services_nova_nova_scheduler{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "D"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Openstack_service_nova",
+ "tooltip": {
+ "shared": true,
+ "sort": 1,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": null,
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": "1",
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "5m",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "nc_region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Openstack openstack_region",
+ "multi": false,
+ "name": "openstack_region",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": false,
+ "label": "namespace",
+ "multi": false,
+ "name": "namespace",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Openstack_Services_Nova",
+ "uid": "openstack-services-nova",
+ "version": 2
+ }
+ openstack-neutron: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": "5.0.0"
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": "5.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 188,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 42,
+ "panels": [],
+ "title": "Neutron API",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(225, 177, 40, 0.59)",
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 0,
+ "y": 1
+ },
+ "id": 40,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_neutron_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "0,1",
+ "title": "Neutron_API_Service",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "OK",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 4,
+ "y": 1
+ },
+ "id": 43,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(nginx_responses_total{server_zone=~\"neutron.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "count",
+ "groupBy": [
+ {
+ "interval": "auto",
+ "params": [
+ "auto"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": "",
+ "title": "HTTP 5xx errors",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "0",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 13,
+ "x": 8,
+ "y": 1
+ },
+ "id": 44,
+ "interval": "> 60s",
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "alias": "healthy",
+ "column": "value",
+ "expr": "openstack_check_neutron_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "select": [],
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "API Availability",
+ "tooltip": {
+ "msResolution": false,
+ "shared": false,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "",
+ "logBase": 1,
+ "max": 1,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 8
+ },
+ "id": 13,
+ "panels": [],
+ "repeat": "agent",
+ "title": "Neutron",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 0,
+ "y": 9
+ },
+ "id": 28,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_neutron_l3_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "neutron_l3_agent_down",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 2,
+ "y": 9
+ },
+ "id": 26,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_neutron_l3_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "neutron_l3_agent_disabled",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 4,
+ "y": 9
+ },
+ "id": 29,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_neutron_dhcp_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "neutron_dhcp_agent_down",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 6,
+ "y": 9
+ },
+ "id": 27,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_neutron_dhcp_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "neutron_dhcp_agent_disabled",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 8,
+ "y": 9
+ },
+ "id": 30,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_neutron_metadata_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "neutron_metadata_agent_down",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 10,
+ "y": 9
+ },
+ "id": 31,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_neutron_metadata_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "neutron_metadata_agent_disabled",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 12,
+ "y": 9
+ },
+ "id": 33,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_neutron_openvswitch_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "neutron_openvswitch_agent_down",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 14,
+ "y": 9
+ },
+ "id": 32,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_neutron_openvswitch_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "neutron_openvswitch_agent_disabled",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 16,
+ "y": 9
+ },
+ "id": 45,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_neutron_sriov_nic_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "neutron_sriov_nic_agent_down",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 18,
+ "y": 9
+ },
+ "id": 46,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_neutron_sriov_nic_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "neutron_sriov_nic_agent_disabled",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 0,
+ "gridPos": {
+ "h": 9,
+ "w": 24,
+ "x": 0,
+ "y": 16
+ },
+ "hideTimeOverride": false,
+ "id": 15,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 1,
+ "points": false,
+ "renderer": "flot",
+ "repeat": null,
+ "repeatDirection": "h",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "openstack_services_neutron_neutron_l3_agent{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A"
+ },
+ {
+ "expr": "openstack_services_neutron_neutron_metadata_agent{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "B"
+ },
+ {
+ "expr": "openstack_services_neutron_neutron_dhcp_agent{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "C"
+ },
+ {
+ "expr": "openstack_services_neutron_neutron_openvswitch_agent{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "D"
+ },
+ {
+ "expr": "openstack_services_neutron_neutron_sriov_nic_agent{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "E"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Neutron_Agents",
+ "tooltip": {
+ "shared": true,
+ "sort": 1,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": null,
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": "1",
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "5m",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "nc_region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Openstack openstack_region",
+ "multi": false,
+ "name": "openstack_region",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": false,
+ "label": "namespace",
+ "multi": false,
+ "name": "namespace",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Openstack_Services_Neutron",
+ "uid": "openstack-services-neutron",
+ "version": 2
+ }
+ openstack-cinder: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": "5.0.0"
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": "5.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 152,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 42,
+ "panels": [],
+ "title": "Cinder API",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(225, 177, 40, 0.59)",
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 0,
+ "y": 1
+ },
+ "id": 40,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_cinder_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "0,1",
+ "title": "Cinder_API_Service",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "OK",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 4,
+ "y": 1
+ },
+ "id": 43,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(nginx_responses_total{server_zone=~\"cinder.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "count",
+ "groupBy": [
+ {
+ "interval": "auto",
+ "params": [
+ "auto"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": "",
+ "title": "HTTP 5xx errors",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "0",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 13,
+ "x": 8,
+ "y": 1
+ },
+ "id": 44,
+ "interval": "> 60s",
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "alias": "healthy",
+ "column": "value",
+ "expr": "openstack_check_cinder_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "select": [],
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "API Availability",
+ "tooltip": {
+ "msResolution": false,
+ "shared": false,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "",
+ "logBase": 1,
+ "max": 1,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 8
+ },
+ "id": 7,
+ "panels": [],
+ "repeat": "openstack_region",
+ "title": "Cinder",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 0,
+ "y": 9
+ },
+ "id": 9,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "maxPerRow": 1,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "repeat": "type",
+ "repeatDirection": "v",
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_cinder_volume_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "hide": false,
+ "intervalFactor": 4,
+ "legendFormat": "",
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Cinder-volume-down",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 2,
+ "y": 9
+ },
+ "id": 23,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_cinder_volume_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Cinder-volume-disabled",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 4,
+ "y": 9
+ },
+ "id": 20,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_cinder_backup_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Cinder-backup-down",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 6,
+ "y": 9
+ },
+ "id": 22,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_cinder_backup_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Cinder-backup-disabled",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 8,
+ "y": 9
+ },
+ "id": 11,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_cinder_scheduler_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Cinder-scheduler-down",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "#299c46",
+ "rgba(237, 129, 40, 0.89)",
+ "#d44a3a"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 2,
+ "x": 10,
+ "y": 9
+ },
+ "id": 21,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "openstack_services_cinder_scheduler_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "A"
+ }
+ ],
+ "thresholds": "1,1",
+ "title": "Cinder-scheduler-disabled",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 0,
+ "gridPos": {
+ "h": 9,
+ "w": 24,
+ "x": 0,
+ "y": 16
+ },
+ "hideTimeOverride": false,
+ "id": 15,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": true,
+ "sort": "current",
+ "sortDesc": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 1,
+ "points": false,
+ "renderer": "flot",
+ "repeat": null,
+ "repeatDirection": "h",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "expr": "openstack_services_cinderv3_cinder_volume{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "",
+ "refId": "A"
+ },
+ {
+ "expr": "openstack_services_cinderv3_cinder_scheduler{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "B"
+ },
+ {
+ "expr": "openstack_services_cinderv3_cinder_backup{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "refId": "C"
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Openstack_service_cinder",
+ "tooltip": {
+ "shared": true,
+ "sort": 1,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "decimals": null,
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": "1",
+ "min": "0",
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": false,
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "nc_region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Openstack openstack_region",
+ "multi": false,
+ "name": "openstack_region",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": false,
+ "label": "namespace",
+ "multi": false,
+ "name": "namespace",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Openstack_Services_Cinder",
+ "uid": "openstack-services-cinder",
+ "version": 2
+ }
+ openstack-glance: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": "5.0.0"
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": "5.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 155,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 42,
+ "panels": [],
+ "title": "Glance API",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(225, 177, 40, 0.59)",
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 0,
+ "y": 1
+ },
+ "id": 40,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_glance_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "0,1",
+ "title": "Glance_API_Service",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "OK",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 4,
+ "y": 1
+ },
+ "id": 43,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(nginx_responses_total{server_zone=~\"glance.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "count",
+ "groupBy": [
+ {
+ "interval": "auto",
+ "params": [
+ "auto"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": "",
+ "title": "HTTP 5xx errors",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "0",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 13,
+ "x": 8,
+ "y": 1
+ },
+ "id": 44,
+ "interval": "> 60s",
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "alias": "healthy",
+ "column": "value",
+ "expr": "openstack_check_glance_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "select": [],
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "API Availability",
+ "tooltip": {
+ "msResolution": false,
+ "shared": false,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "",
+ "logBase": 1,
+ "max": 1,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "5m",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "nc_region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "OpenStack Region",
+ "multi": false,
+ "name": "openstack_region",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": false,
+ "label": "namespace",
+ "multi": false,
+ "name": "namespace",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Openstack_Services_Glance",
+ "uid": "openstack-services-glance",
+ "version": 2
+ }
+ openstack-heat: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": "5.0.0"
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": "5.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 158,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 42,
+ "panels": [],
+ "title": "Heat API",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(225, 177, 40, 0.59)",
+ "rgba(200, 54, 35, 0.88)",
+ "#299c46"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 0,
+ "y": 1
+ },
+ "id": 40,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_heat_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "0,1",
+ "title": "Heat_API_Service",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "OK",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 4,
+ "y": 1
+ },
+ "id": 43,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(nginx_responses_total{server_zone=~\"heat.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "count",
+ "groupBy": [
+ {
+ "interval": "auto",
+ "params": [
+ "auto"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": "",
+ "title": "HTTP 5xx errors",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "0",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 13,
+ "x": 8,
+ "y": 1
+ },
+ "id": 44,
+ "interval": "> 60s",
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "alias": "healthy",
+ "column": "value",
+ "expr": "openstack_check_heat_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "select": [],
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "API Availability",
+ "tooltip": {
+ "msResolution": false,
+ "shared": false,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "",
+ "logBase": 1,
+ "max": 1,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 8
+ },
+ "id": 46,
+ "panels": [],
+ "title": "Heat CFN API",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(225, 177, 40, 0.59)",
+ "rgba(200, 54, 35, 0.88)",
+ "#299c46"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 0,
+ "y": 9
+ },
+ "id": 48,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_heat_cfn_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "0,1",
+ "title": "Heat_CFN_API_Service",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "OK",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 4,
+ "y": 9
+ },
+ "id": 47,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(nginx_responses_total{server_zone=~\"heat_cfn.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "count",
+ "groupBy": [
+ {
+ "interval": "auto",
+ "params": [
+ "auto"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": "",
+ "title": "HTTP 5xx errors",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "0",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 13,
+ "x": 8,
+ "y": 9
+ },
+ "id": 49,
+ "interval": "> 60s",
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "alias": "healthy",
+ "column": "value",
+ "expr": "openstack_check_heat_cfn_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "select": [],
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "API Availability",
+ "tooltip": {
+ "msResolution": false,
+ "shared": false,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "",
+ "logBase": 1,
+ "max": 1,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "5m",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "nc_region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "OpenStack Region",
+ "multi": false,
+ "name": "openstack_region",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": false,
+ "label": "namespace",
+ "multi": false,
+ "name": "namespace",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Openstack_Services_Heat",
+ "uid": "openstack-services-heat",
+ "version": 2
+ }
+ openstack-keystone: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": "5.0.0"
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": "5.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 185,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 42,
+ "panels": [],
+ "title": "Keystone API",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(225, 177, 40, 0.59)",
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 0,
+ "y": 1
+ },
+ "id": 40,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_keystone_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\",nc_region=~\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "instant": false,
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "0,1",
+ "title": "Keystone_API_Service",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "OK",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 4,
+ "y": 1
+ },
+ "id": 43,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(nginx_responses_total{server_zone=~\"keystone.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\",nc_region=~\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "count",
+ "groupBy": [
+ {
+ "interval": "auto",
+ "params": [
+ "auto"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": "",
+ "title": "HTTP 5xx errors",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "0",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 13,
+ "x": 8,
+ "y": 1
+ },
+ "id": 44,
+ "interval": "> 60s",
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "alias": "healthy",
+ "column": "value",
+ "expr": "openstack_check_keystone_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\",nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "select": [],
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "API Availability",
+ "tooltip": {
+ "msResolution": false,
+ "shared": false,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "",
+ "logBase": 1,
+ "max": 1,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": false,
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "nc_region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "OpenStack Region",
+ "multi": false,
+ "name": "openstack_region",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": false,
+ "label": "namespace",
+ "multi": false,
+ "name": "namespace",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Openstack_Services_Keystone",
+ "uid": "openstack-service-keystone",
+ "version": 2
+ }
+ openstack-placement: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": "5.0.0"
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": "5.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 77,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 42,
+ "panels": [],
+ "title": "Placement API",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(225, 177, 40, 0.59)",
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 0,
+ "y": 1
+ },
+ "id": 40,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_placement_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "instant": false,
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "0,1",
+ "title": "Placement_API_Service",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "OK",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 4,
+ "y": 1
+ },
+ "id": 43,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(nginx_responses_total{server_zone=~\"placement.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "count",
+ "groupBy": [
+ {
+ "interval": "auto",
+ "params": [
+ "auto"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": "",
+ "title": "HTTP 5xx errors",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "0",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 13,
+ "x": 8,
+ "y": 1
+ },
+ "id": 44,
+ "interval": "> 60s",
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "alias": "healthy",
+ "column": "value",
+ "expr": "openstack_check_placement_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "select": [],
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "API Availability",
+ "tooltip": {
+ "msResolution": false,
+ "shared": false,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "",
+ "logBase": 1,
+ "max": 1,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": false,
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "nc_region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "OpenStack Region",
+ "multi": false,
+ "name": "openstack_region",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {
+ "tags": [],
+ "text": "openstack",
+ "value": "openstack"
+ },
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": false,
+ "label": "namespace",
+ "multi": false,
+ "name": "namespace",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Openstack_Services_Placement",
+ "uid": "openstack_services_placement",
+ "version": 1
+ }
+ openstack-swift: |-
+ {
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph",
+ "version": "5.0.0"
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "5.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "singlestat",
+ "name": "Singlestat",
+ "version": "5.0.0"
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 203,
+ "links": [],
+ "panels": [
+ {
+ "collapsed": false,
+ "gridPos": {
+ "h": 1,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 42,
+ "panels": [],
+ "title": "Swift API",
+ "type": "row"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(225, 177, 40, 0.59)",
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 0,
+ "y": 1
+ },
+ "id": 40,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "openstack_check_swift_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "fill": "",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "null"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "groupby_field": "",
+ "instant": false,
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120
+ }
+ ],
+ "thresholds": "0,1",
+ "title": "Swift_API_Service",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "CRITICAL",
+ "value": "0"
+ },
+ {
+ "op": "=",
+ "text": "OK",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "cacheTimeout": null,
+ "colorBackground": false,
+ "colorValue": false,
+ "colors": [
+ "rgba(200, 54, 35, 0.88)",
+ "rgba(118, 245, 40, 0.73)",
+ "rgba(225, 177, 40, 0.59)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 4,
+ "x": 4,
+ "y": 1
+ },
+ "id": 43,
+ "interval": "> 60s",
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "50%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": true
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "column": "value",
+ "condition": "",
+ "expr": "sum(nginx_responses_total{server_zone=~\"swift.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"})",
+ "fill": "",
+ "format": "time_series",
+ "function": "count",
+ "groupBy": [
+ {
+ "interval": "auto",
+ "params": [
+ "auto"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupby_field": "",
+ "interval": "",
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": "",
+ "title": "HTTP 5xx errors",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "0",
+ "value": "null"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "editable": true,
+ "error": false,
+ "fill": 0,
+ "grid": {},
+ "gridPos": {
+ "h": 7,
+ "w": 13,
+ "x": 8,
+ "y": 1
+ },
+ "id": 44,
+ "interval": "> 60s",
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 3,
+ "links": [],
+ "nullPointMode": "connected",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": true,
+ "targets": [
+ {
+ "alias": "healthy",
+ "column": "value",
+ "expr": "openstack_check_swift_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}",
+ "format": "time_series",
+ "function": "last",
+ "groupBy": [
+ {
+ "params": [
+ "$interval"
+ ],
+ "type": "time"
+ },
+ {
+ "params": [
+ "0"
+ ],
+ "type": "fill"
+ }
+ ],
+ "groupByTags": [],
+ "intervalFactor": 2,
+ "policy": "default",
+ "rawQuery": false,
+ "refId": "A",
+ "resultFormat": "time_series",
+ "select": [],
+ "step": 120,
+ "tags": []
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "API Availability",
+ "tooltip": {
+ "msResolution": false,
+ "shared": false,
+ "sort": 0,
+ "value_type": "cumulative"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "none",
+ "label": "",
+ "logBase": 1,
+ "max": 1,
+ "min": 0,
+ "show": true
+ },
+ {
+ "format": "short",
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": false
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": false,
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "nc_region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "OpenStack Region",
+ "multi": false,
+ "name": "openstack_region",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "${DS_PROMETHEUS}",
+ "definition": "",
+ "hide": 0,
+ "includeAll": false,
+ "label": "namespace",
+ "multi": false,
+ "name": "namespace",
+ "options": [],
+ "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "Openstack_Services_Swift",
+ "uid": "openstack-services-swift",
+ "version": 2
+ }
+ rabbitmq_stats: |-
+ {
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": "-- Grafana --",
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "Basic rabbitmq host stats: Node Stats, Exchanges, Channels, Consumers, Connections, Queues, Messages, Messages per Queue, Memory, File Descriptors, Sockets.",
+ "editable": false,
+ "overwrite": true,
+ "gnetId": null,
+ "graphTooltip": 0,
+ "id": 87,
+ "links": [],
+ "panels": [
+ {
+ "cacheTimeout": null,
+ "colorBackground": true,
+ "colorValue": false,
+ "colors": [
+ "rgba(50, 172, 45, 0.97)",
+ "rgba(237, 129, 40, 0.89)",
+ "rgba(245, 54, 54, 0.9)"
+ ],
+ "datasource": "${DS_PROMETHEUS}",
+ "format": "none",
+ "gauge": {
+ "maxValue": 100,
+ "minValue": 0,
+ "show": false,
+ "thresholdLabels": false,
+ "thresholdMarkers": true
+ },
+ "gridPos": {
+ "h": 7,
+ "w": 6,
+ "x": 0,
+ "y": 0
+ },
+ "id": 13,
+ "interval": null,
+ "links": [],
+ "mappingType": 1,
+ "mappingTypes": [
+ {
+ "name": "value to text",
+ "value": 1
+ },
+ {
+ "name": "range to text",
+ "value": 2
+ }
+ ],
+ "maxDataPoints": 100,
+ "nullPointMode": "connected",
+ "nullText": null,
+ "options": {},
+ "postfix": "",
+ "postfixFontSize": "50%",
+ "prefix": "",
+ "prefixFontSize": "30%",
+ "rangeMaps": [
+ {
+ "from": "null",
+ "text": "N/A",
+ "to": "null"
+ }
+ ],
+ "sparkline": {
+ "fillColor": "rgba(31, 118, 189, 0.18)",
+ "full": false,
+ "lineColor": "rgb(31, 120, 193)",
+ "show": false
+ },
+ "tableColumn": "",
+ "targets": [
+ {
+ "expr": "count (rabbitmq_up{nc_region=~\"$region\"} == 1)",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "",
+ "metric": "rabbitmq_up",
+ "refId": "A",
+ "step": 2
+ }
+ ],
+ "thresholds": "Up,Down",
+ "timeFrom": "30s",
+ "title": "RabbitMQ Server",
+ "type": "singlestat",
+ "valueFontSize": "80%",
+ "valueMaps": [
+ {
+ "op": "=",
+ "text": "N/A",
+ "value": "null"
+ },
+ {
+ "op": "=",
+ "text": "Down",
+ "value": "0"
+ },
+ {
+ "op": ">=",
+ "text": "Up",
+ "value": "1"
+ }
+ ],
+ "valueName": "current"
+ },
+ {
+ "aliasColors": {},
+ "bars": true,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "prometheus",
+ "decimals": 0,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 18,
+ "x": 6,
+ "y": 0
+ },
+ "id": 12,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": false,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rabbitmq_running{nc_region=~\"$region\",node=~\"$rabbitmq_node\"}",
+ "format": "time_series",
+ "intervalFactor": 1,
+ "legendFormat": "{{pod}}",
+ "metric": "rabbitmq_running",
+ "refId": "A",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": "30s",
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Node up Stats",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 0,
+ "y": 7
+ },
+ "id": 6,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rabbitmq_exchanges{nc_region=~\"$region\",kubernetes_namespace=~\"$namespace\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{release_group}}:exchanges",
+ "metric": "rabbitmq_exchangesTotal",
+ "refId": "A",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Number of Exchanges",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 8,
+ "y": 7
+ },
+ "id": 4,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rabbitmq_channels{nc_region=~\"$region\",kubernetes_namespace=~\"$namespace\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{release_group}}:channels",
+ "metric": "rabbitmq_channelsTotal",
+ "refId": "A",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Number of Channels",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 16,
+ "y": 7
+ },
+ "id": 3,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rabbitmq_consumers{nc_region=~\"$region\",kubernetes_namespace=~\"$namespace\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{release_group}}:consumers",
+ "metric": "rabbitmq_consumersTotal",
+ "refId": "A",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Number of Consumers",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 0,
+ "y": 14
+ },
+ "id": 5,
+ "legend": {
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rabbitmq_connections{nc_region=~\"$region\",kubernetes_namespace=~\"$namespace\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{release_group}}:connections",
+ "metric": "rabbitmq_connectionsTotal",
+ "refId": "A",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Number of Connections",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 8,
+ "x": 8,
+ "y": 14
+ },
+ "id": 7,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rabbitmq_queues{nc_region=~\"$region\",kubernetes_namespace=~\"$namespace\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{release_group}}:queues",
+ "metric": "rabbitmq_queuesTotal",
+ "refId": "A",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Number of Queues",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 21
+ },
+ "id": 8,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "sum by (vhost)(rabbitmq_queue_messages_ready{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\"})",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{vhost}}:ready",
+ "metric": "rabbitmq_queue_messages_ready",
+ "refId": "A",
+ "step": 2
+ },
+ {
+ "expr": "sum by (vhost)(rabbitmq_queue_messages_published_total{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\"})",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{vhost}}:published",
+ "metric": "rabbitmq_queue_messages_published_total",
+ "refId": "B",
+ "step": 2
+ },
+ {
+ "expr": "sum by (vhost)(rabbitmq_queue_messages_delivered_total{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\"})",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{vhost}}:delivered",
+ "metric": "rabbitmq_queue_messages_delivered_total",
+ "refId": "C",
+ "step": 2
+ },
+ {
+ "expr": "sum by (vhost)(rabbitmq_queue_messages_unacknowledged{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\"})",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{vhost}}:unack",
+ "metric": "ack",
+ "refId": "D",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Messages/vhost",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "decimals": 0,
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 21
+ },
+ "id": 2,
+ "legend": {
+ "alignAsTable": true,
+ "avg": false,
+ "current": true,
+ "max": false,
+ "min": false,
+ "rightSide": false,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rabbitmq_queue_messages{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{queue}}:{{durable}}",
+ "metric": "rabbitmq_queue_messages",
+ "refId": "A",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Messages / Queue",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 28
+ },
+ "id": 9,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rabbitmq_node_mem_used{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\", node=~\"$rabbitmq_node\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{pod}}:used",
+ "metric": "rabbitmq_node_mem_used",
+ "refId": "A",
+ "step": 2
+ },
+ {
+ "expr": "rabbitmq_node_mem_limit{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\", node=~\"$rabbitmq_node\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{pod}}:limit",
+ "metric": "node_mem",
+ "refId": "B",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Memory",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "decbytes",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 12,
+ "y": 28
+ },
+ "id": 10,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rabbitmq_fd_used{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\", node=~\"$rabbitmq_node\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{pod}}:used",
+ "metric": "",
+ "refId": "A",
+ "step": 2
+ },
+ {
+ "expr": "rabbitmq_fd_total{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\", node=~\"$rabbitmq_node\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{pod}}:total",
+ "metric": "node_mem",
+ "refId": "B",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "File descriptors",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": "${DS_PROMETHEUS}",
+ "fill": 1,
+ "gridPos": {
+ "h": 7,
+ "w": 12,
+ "x": 0,
+ "y": 35
+ },
+ "id": 11,
+ "legend": {
+ "alignAsTable": true,
+ "avg": true,
+ "current": true,
+ "max": true,
+ "min": true,
+ "show": true,
+ "total": false,
+ "values": true
+ },
+ "lines": true,
+ "linewidth": 1,
+ "links": [],
+ "nullPointMode": "null",
+ "options": {},
+ "percentage": false,
+ "pointradius": 5,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "expr": "rabbitmq_sockets_used{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\", node=~\"$rabbitmq_node\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{pod}}:used",
+ "metric": "",
+ "refId": "A",
+ "step": 2
+ },
+ {
+ "expr": "rabbitmq_sockets_total{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\", node=~\"$rabbitmq_node\"}",
+ "format": "time_series",
+ "intervalFactor": 2,
+ "legendFormat": "{{pod}}:total",
+ "metric": "",
+ "refId": "B",
+ "step": 2
+ }
+ ],
+ "thresholds": [],
+ "timeFrom": null,
+ "timeRegions": [],
+ "timeShift": null,
+ "title": "Sockets",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "buckets": null,
+ "mode": "time",
+ "name": null,
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ },
+ {
+ "format": "short",
+ "label": null,
+ "logBase": 1,
+ "max": null,
+ "min": null,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false,
+ "alignLevel": null
+ }
+ }
+ ],
+ "refresh": "1m",
+ "schemaVersion": 18,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": [
+ {
+ "current": {
+ "text": "prometheus",
+ "value": "prometheus"
+ },
+ "hide": 0,
+ "includeAll": false,
+ "label": "Prometheus datasource",
+ "multi": false,
+ "name": "DS_PROMETHEUS",
+ "options": [],
+ "query": "prometheus",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "type": "datasource"
+ },
+ {
+ "allValue": ".+",
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(nc_region)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "NC Region",
+ "multi": false,
+ "name": "region",
+ "options": [],
+ "query": "label_values(nc_region)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(rabbitmq_up{nc_region=\"$region\"}, kubernetes_namespace)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Namespace",
+ "multi": false,
+ "name": "namespace",
+ "options": [],
+ "query": "label_values(rabbitmq_up{nc_region=\"$region\"}, kubernetes_namespace)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ },
+ {
+ "allValue": null,
+ "current": {},
+ "datasource": "$DS_PROMETHEUS",
+ "definition": "label_values(rabbitmq_up{kubernetes_namespace=\"$namespace\"}, node)",
+ "hide": 0,
+ "includeAll": false,
+ "label": "Node",
+ "multi": false,
+ "name": "rabbitmq_node",
+ "options": [],
+ "query": "label_values(rabbitmq_up{kubernetes_namespace=\"$namespace\"}, node)",
+ "refresh": 1,
+ "regex": "",
+ "skipUrlSync": false,
+ "sort": 0,
+ "tagValuesQuery": "",
+ "tags": [],
+ "tagsQuery": "",
+ "type": "query",
+ "useTags": false
+ }
+ ]
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "5s",
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ],
+ "time_options": [
+ "5m",
+ "15m",
+ "1h",
+ "6h",
+ "12h",
+ "24h",
+ "2d",
+ "7d",
+ "30d"
+ ]
+ },
+ "timezone": "UTC",
+ "title": "RabbitMQ Stats",
+ "uid": "rabbitmq-stats",
+ "version": 4
+ }
dependencies:
- grafana-htk
...
diff --git a/global/software/charts/osh-infra/osh-infra-dashboards/kibana.yaml b/global/software/charts/osh-infra/osh-infra-dashboards/kibana.yaml
index 5931ca706..f6866e09a 100644
--- a/global/software/charts/osh-infra/osh-infra-dashboards/kibana.yaml
+++ b/global/software/charts/osh-infra/osh-infra-dashboards/kibana.yaml
@@ -99,21 +99,23 @@ data:
create_kibana_indexes:
enabled: true
indexes:
- - airship
- - audit_tsee
- - auth
- - calico
- - ceph
- - flows
- - jenkins
- - journal
- - kernel_syslog
- - libvirt
- - logstash
- - lma
- - openstack
- - utility_access
- - openvswitch
+ base:
+ - airship
+ - audit_tsee
+ - auth
+ - calico
+ - ceph
+ - flows
+ - jenkins
+ - journal
+ - kernel_syslog
+ - libvirt
+ - logstash
+ - lma
+ - utility_access
+ application:
+ - openstack
+ - openvswitch
default_index: logstash
kibana:
elasticsearch:
diff --git a/global/software/charts/osh/openstack-compute-kit/chart-group.yaml b/global/software/charts/osh/openstack-compute-kit/chart-group.yaml
index 6fd239081..6b76be83f 100644
--- a/global/software/charts/osh/openstack-compute-kit/chart-group.yaml
+++ b/global/software/charts/osh/openstack-compute-kit/chart-group.yaml
@@ -10,9 +10,10 @@ metadata:
layer: global
storagePolicy: cleartext
data:
- description: Deploy Nova, Neutron, Openvswitch, and Libvirt
+ description: Deploy Nova, Neutron, Openvswitch, Placement, and Libvirt
chart_group:
- libvirt
- openvswitch
- neutron
+ - placement
- nova
diff --git a/global/software/charts/osh/openstack-compute-kit/neutron.yaml b/global/software/charts/osh/openstack-compute-kit/neutron.yaml
index bc20103ae..bcf575c6f 100644
--- a/global/software/charts/osh/openstack-compute-kit/neutron.yaml
+++ b/global/software/charts/osh/openstack-compute-kit/neutron.yaml
@@ -236,7 +236,7 @@ data:
native:
enabled: false
test:
- timeout: 720
+ timeout: 1400
install:
no_hooks: false
upgrade:
diff --git a/global/software/charts/osh/openstack-compute-kit/nova.yaml b/global/software/charts/osh/openstack-compute-kit/nova.yaml
index 5cfa1a5cd..ff3acff48 100644
--- a/global/software/charts/osh/openstack-compute-kit/nova.yaml
+++ b/global/software/charts/osh/openstack-compute-kit/nova.yaml
@@ -325,6 +325,20 @@ data:
post:
create: []
values:
+ manifests:
+ # NOTE(lamt): disable consoleauth and placement from nova in Train release.
+ certificates: false
+ deployment_consoleauth: false
+ deployment_placement: false
+ ingress_placement: false
+ job_db_init_placement: false
+ job_ks_placement_endpoints: false
+ job_ks_placement_service: false
+ job_ks_placement_user: false
+ pdb_placement: false
+ secret_keystone_placement: false
+ service_ingress_placement: false
+ service_placement: false
dependencies:
static:
rabbit_init:
@@ -775,20 +789,14 @@ data:
values:
- RetryFilter
- AvailabilityZoneFilter
- - RamFilter
- - CoreFilter
- - DiskFilter
- ComputeFilter
- ImagePropertiesFilter
- ServerGroupAntiAffinityFilter
- ServerGroupAffinityFilter
- AggregateInstanceExtraSpecsFilter
- - AggregateCoreFilter
- - AggregateRamFilter
- AggregateMultiTenancyIsolation
- JsonFilter
- IoOpsFilter
- - AggregateDiskFilter
- AllHostsFilter
- IsolatedHostsFilter
- AggregateImagePropertiesIsolation
@@ -816,6 +824,7 @@ data:
key_pairs: 10
cinder:
http_retries: 6
+ catalog_info: "volumev3::internalURL"
oslo_messaging_rabbit:
heartbeat_timeout_threshold: 60
audit_middleware_notifications:
diff --git a/global/software/charts/osh/openstack-compute-kit/placement.yaml b/global/software/charts/osh/openstack-compute-kit/placement.yaml
new file mode 100644
index 000000000..f8c7f64ad
--- /dev/null
+++ b/global/software/charts/osh/openstack-compute-kit/placement.yaml
@@ -0,0 +1,416 @@
+---
+schema: armada/Chart/v1
+metadata:
+ schema: metadata/Document/v1
+ name: placement
+ labels:
+ name: placement-global
+ component: placement
+ layeringDefinition:
+ abstract: false
+ layer: global
+ storagePolicy: cleartext
+ substitutions:
+ # Chart source
+ - src:
+ schema: pegleg/SoftwareVersions/v1
+ name: software-versions
+ path: .charts.osh.placement
+ dest:
+ path: .source
+
+ # Images
+ - src:
+ schema: pegleg/SoftwareVersions/v1
+ name: software-versions
+ path: .images.osh.placement
+ dest:
+ path: .values.images.tags
+
+ # Endpoints
+ - src:
+ schema: pegleg/EndpointCatalogue/v1
+ name: osh_endpoints
+ path: .osh.identity
+ dest:
+ path: .values.endpoints.identity
+ - src:
+ schema: pegleg/EndpointCatalogue/v1
+ name: osh_endpoints
+ path: .osh.oslo_db
+ dest:
+ path: .values.endpoints.oslo_db
+ - src:
+ schema: pegleg/EndpointCatalogue/v1
+ name: osh_endpoints
+ path: .osh.oslo_messaging
+ dest:
+ path: .values.endpoints.oslo_messaging
+ - src:
+ schema: pegleg/EndpointCatalogue/v1
+ name: osh_endpoints
+ path: .osh.oslo_cache
+ dest:
+ path: .values.endpoints.oslo_cache
+ - src:
+ schema: pegleg/EndpointCatalogue/v1
+ name: osh_endpoints
+ path: .osh.placement
+ dest:
+ path: .values.endpoints.placement
+
+ # Service Accounts
+ - src:
+ schema: pegleg/AccountCatalogue/v1
+ name: osh_service_accounts
+ path: .osh.keystone.admin
+ dest:
+ path: .values.endpoints.identity.auth.admin
+ - src:
+ schema: pegleg/AccountCatalogue/v1
+ name: osh_service_accounts
+ path: .osh.placement.placement
+ dest:
+ path: .values.endpoints.identity.auth.placement
+ - src:
+ schema: pegleg/AccountCatalogue/v1
+ name: osh_service_accounts
+ path: .osh.placement.test
+ dest:
+ path: .values.endpoints.identity.auth.test
+ - src:
+ schema: pegleg/AccountCatalogue/v1
+ name: osh_service_accounts
+ path: .osh.oslo_messaging.admin
+ dest:
+ path: .values.endpoints.oslo_messaging.auth.admin
+ - src:
+ schema: pegleg/AccountCatalogue/v1
+ name: osh_service_accounts
+ path: .osh.nova.oslo_messaging.placement
+ dest:
+ path: .values.endpoints.oslo_messaging.auth.placement
+ - src:
+ schema: pegleg/AccountCatalogue/v1
+ name: osh_service_accounts
+ path: .osh.placement.oslo_db.username
+ dest:
+ path: .values.endpoints.oslo_db.auth.placement.username
+ - src:
+ schema: pegleg/AccountCatalogue/v1
+ name: osh_service_accounts
+ path: .osh.placement.oslo_db.database
+ dest:
+ path: .values.endpoints.oslo_db.path
+ pattern: DB_NAME
+
+ # Secrets
+ - dest:
+ path: .values.endpoints.identity.auth.admin.password
+ src:
+ schema: deckhand/Passphrase/v1
+ name: osh_keystone_admin_password
+ path: .
+ - dest:
+ path: .values.endpoints.identity.auth.placement.password
+ src:
+ schema: deckhand/Passphrase/v1
+ name: osh_placement_password
+ path: .
+ - dest:
+ path: .values.endpoints.identity.auth.test.password
+ src:
+ schema: deckhand/Passphrase/v1
+ name: osh_nova_test_password
+ path: .
+ - dest:
+ path: .values.endpoints.identity.auth.neutron.password
+ src:
+ schema: deckhand/Passphrase/v1
+ name: osh_neutron_password
+ path: .
+ - dest:
+ path: .values.endpoints.identity.auth.placement.password
+ src:
+ schema: deckhand/Passphrase/v1
+ name: osh_placement_password
+ path: .
+ - dest:
+ path: .values.endpoints.identity.auth.ironic.password
+ src:
+ schema: deckhand/Passphrase/v1
+ name: osh_ironic_password
+ path: .
+ - dest:
+ path: .values.endpoints.oslo_messaging.auth.admin.password
+ src:
+ schema: deckhand/Passphrase/v1
+ name: osh_oslo_messaging_admin_password
+ path: .
+ - dest:
+ path: .values.endpoints.oslo_messaging.auth.placement.password
+ src:
+ schema: deckhand/Passphrase/v1
+ name: osh_nova_oslo_messaging_password
+ path: .
+ - dest:
+ path: .values.endpoints.oslo_db.auth.placement.password
+ src:
+ schema: deckhand/Passphrase/v1
+ name: osh_nova_oslo_db_password
+ path: .
+ - dest:
+ path: .values.endpoints.oslo_db.auth.admin.password
+ src:
+ schema: deckhand/Passphrase/v1
+ name: osh_oslo_db_admin_password
+ path: .
+ - dest:
+ path: .values.endpoints.oslo_cache.auth.memcache_secret_key
+ src:
+ schema: deckhand/Passphrase/v1
+ name: osh_oslo_cache_secret_key
+ path: .
+ - dest:
+ path: .values.endpoints.oslo_db.auth.nova_api.password
+ src:
+ schema: deckhand/Passphrase/v1
+ name: osh_nova_oslo_db_password
+ path: .
+ - dest:
+ path: .values.endpoints.oslo_db.auth.nova_api.username
+ src:
+ schema: pegleg/AccountCatalogue/v1
+ name: osh_service_accounts
+ path: .osh.nova.oslo_db.username
+
+
+data:
+ chart_name: placement
+ release: placement
+ namespace: openstack
+ wait:
+ timeout: 2700
+ labels:
+ release_group: clcp-placement
+ resources:
+ - type: job
+ - type: deployment
+ min_ready: 100%
+ native:
+ enabled: false
+ test:
+ timeout: 600
+ install:
+ no_hooks: false
+ upgrade:
+ no_hooks: false
+ pre:
+ delete:
+ - type: job
+ labels:
+ release_group: clcp-placement
+ post:
+ create: []
+ values:
+ manifests:
+ certificates: false
+ job_db_migrate: false
+ dependencies:
+ static:
+ rabbit_init:
+ services:
+ - endpoint: internal
+ service: oslo_messaging
+ jobs:
+ - clcp-openstack-rabbitmq-cluster-wait
+ db_sync:
+ jobs:
+ - placement-db-init
+ labels:
+ job:
+ node_selector_key: openstack-control-plane
+ node_selector_value: enabled
+ api:
+ node_selector_key: openstack-control-plane
+ node_selector_value: enabled
+ test:
+ node_selector_key: openstack-control-plane
+ node_selector_value: enabled
+ pod:
+ mandatory_access_control:
+ type: apparmor
+ placement-api:
+ placement-api: runtime/default
+ init: runtime/default
+ placement-db-migrate:
+ init: runtime/default
+ placement-mysql-migration: runtime/default
+ replicas:
+ api: 4
+ affinity:
+ anti:
+ type:
+ placement: requiredDuringSchedulingIgnoredDuringExecution
+ weight:
+ default: 100
+ lifecycle:
+ upgrades:
+ deployments:
+ pod_replacement_strategy: RollingUpdate
+ rolling_update:
+ max_unavailable: 50%
+ security_context:
+ placement:
+ container:
+ placement_api:
+ allowPrivilegeEscalation: false
+ network:
+ api:
+ ingress:
+ annotations:
+ nginx.ingress.kubernetes.io/backend-protocol: "https"
+ nginx.ingress.kubernetes.io/configuration-snippet: |
+ more_set_headers "X-XSS-Protection: 1; mode=block";
+ more_set_headers "X-Frame-Options: deny";
+ if ($request_method !~ ^(HEAD|GET|POST|PUT|PATCH|DELETE)$ ) {
+ return 405;
+ }
+ conf:
+ logging:
+ loggers:
+ keys:
+ - root
+ - placement
+ - oslo.messaging
+ handlers:
+ keys:
+ - stdout
+ - stderr
+ - "null"
+ formatters:
+ keys:
+ - context
+ - default
+ logger_root:
+ level: WARNING
+ handlers: "null"
+ logger_placement:
+ level: INFO
+ handlers:
+ - stdout
+ qualname: placement
+ logger_oslo.messaging:
+ level: INFO
+ handlers:
+ - stdout
+ qualname: oslo.messaging
+ logger_amqp:
+ level: WARNING
+ handlers: stderr
+ qualname: amqp
+ logger_amqplib:
+ level: WARNING
+ handlers: stderr
+ qualname: amqplib
+ logger_eventletwsgi:
+ level: WARNING
+ handlers: stderr
+ qualname: eventlet.wsgi.server
+ logger_sqlalchemy:
+ level: WARNING
+ handlers: stderr
+ qualname: sqlalchemy
+ logger_boto:
+ level: WARNING
+ handlers: stderr
+ qualname: boto
+ handler_null:
+ class: logging.NullHandler
+ formatter: default
+ args: ()
+ handler_stdout:
+ class: StreamHandler
+ args: (sys.stdout,)
+ formatter: context
+ handler_stderr:
+ class: StreamHandler
+ args: (sys.stderr,)
+ formatter: context
+ formatter_context:
+ class: oslo_log.formatters.ContextFormatter
+ formatter_default:
+ format: "%(message)s"
+ policy:
+ "context_is_admin": "role:admin"
+ "admin_or_owner": "rule:context_is_admin or project_id:%(project_id)s"
+ "default": "rule:admin_or_owner"
+ "admin_api": "role:admin"
+ "placement:resource_providers:list": "rule:admin_api"
+ "placement:resource_providers:create": "rule:admin_api"
+ "placement:resource_providers:show": "rule:admin_api"
+ "placement:resource_providers:update": "rule:admin_api"
+ "placement:resource_providers:delete": "rule:admin_api"
+ "placement:resource_classes:list": "rule:admin_api"
+ "placement:resource_classes:create": "rule:admin_api"
+ "placement:resource_classes:show": "rule:admin_api"
+ "placement:resource_classes:update": "rule:admin_api"
+ "placement:resource_classes:delete": "rule:admin_api"
+ "placement:resource_providers:inventories:list": "rule:admin_api"
+ "placement:resource_providers:inventories:create": "rule:admin_api"
+ "placement:resource_providers:inventories:show": "rule:admin_api"
+ "placement:resource_providers:inventories:update": "rule:admin_api"
+ "placement:resource_providers:inventories:delete": "rule:admin_api"
+ "placement:resource_providers:aggregates:list": "rule:admin_api"
+ "placement:resource_providers:aggregates:update": "rule:admin_api"
+ "placement:resource_providers:usages": "rule:admin_api"
+ "placement:usages": "rule:admin_api"
+ "placement:traits:list": "rule:admin_api"
+ "placement:traits:show": "rule:admin_api"
+ "placement:traits:update": "rule:admin_api"
+ "placement:traits:delete": "rule:admin_api"
+ "placement:resource_providers:traits:list": "rule:admin_api"
+ "placement:resource_providers:traits:update": "rule:admin_api"
+ "placement:resource_providers:traits:delete": "rule:admin_api"
+ "placement:allocations:manage": "rule:admin_api"
+ "placement:allocations:list": "rule:admin_api"
+ "placement:allocations:update": "rule:admin_api"
+ "placement:allocations:delete": "rule:admin_api"
+ "placement:resource_providers:allocations:list": "rule:admin_api"
+ "placement:allocation_candidates:list": "rule:admin_api"
+ "placement:reshaper:reshape": "rule:admin_api"
+ "not_implemented_in_aic": '!'
+ placement:
+ DEFAULT:
+ debug: false
+ dependencies:
+ - os-placement-htk
+...
+---
+schema: armada/Chart/v1
+metadata:
+ schema: metadata/Document/v1
+ name: os-placement-htk
+ layeringDefinition:
+ abstract: false
+ layer: global
+ substitutions:
+ - src:
+ schema: pegleg/SoftwareVersions/v1
+ name: software-versions
+ path: .charts.osh.placement-htk
+ dest:
+ path: .source
+ storagePolicy: cleartext
+data:
+ chart_name: os-placement-htk
+ release: os-placement-htk
+ namespace: os-placement-htk
+ timeout: 600
+ wait:
+ timeout: 600
+ upgrade:
+ no_hooks: true
+ values: {}
+ dependencies: []
+...
diff --git a/global/software/charts/ucp/ceph/ceph-client-update.yaml b/global/software/charts/ucp/ceph/ceph-client-update.yaml
index c7f3e7da2..666e47699 100644
--- a/global/software/charts/ucp/ceph/ceph-client-update.yaml
+++ b/global/software/charts/ucp/ceph/ceph-client-update.yaml
@@ -123,13 +123,13 @@ data:
enabled: true
script: |
set -x
- DESIRED_VERSION="octopus"
+ DESIRED_VERSION="nautilus"
ADDITIONAL_VERSIONS=1
while [ $ADDITIONAL_VERSIONS -gt 0 ]; do
sleep 5
- ADDITIONAL_VERSIONS=$(ceph tell osd.* version --format json | awk -F 'osd.[0-9]*: ' '/^osd/ { print $2}' | jq -r '.release' | uniq | grep -v ${DESIRED_VERSION} | wc -l )
+ ADDITIONAL_VERSIONS=$(ceph tell osd.* version --format json | awk -F 'osd.[0-9]*: ' '/^osd/ { print $2}' | jq -r '.version' | awk '{ print $(NF-1) }' | uniq | grep -v ${DESIRED_VERSION} | wc -l )
done
- while [[ `ceph pg stat -f json | jq -r ".pg_summary.num_pgs"` -eq 0 ]] || [[ `ceph pg ls -f json | jq -r '.pg_stats[].state' | grep -v "active"` ]]
+ while [[ `ceph pg ls | tail -n +2 | grep -v "active+\|NOTE"` ]]
do
sleep 5
done
@@ -239,9 +239,7 @@ data:
features:
# NOTE(st053q): If autoscaler is disabled, then
# mon_pg_warn_max_object_skew should not be 0 in ceph.conf
- pg_autoscaler: true
- cluster_flags:
- unset: "noup"
+ pg_autoscaler: false
pool:
spec:
# Health metrics pool
diff --git a/global/software/charts/ucp/ceph/ceph-client.yaml b/global/software/charts/ucp/ceph/ceph-client.yaml
index a1823a9a7..2325cf630 100644
--- a/global/software/charts/ucp/ceph/ceph-client.yaml
+++ b/global/software/charts/ucp/ceph/ceph-client.yaml
@@ -93,6 +93,7 @@ data:
component: test
test:
enabled: true
+ timeout: 3600
values:
labels:
job:
@@ -211,8 +212,6 @@ data:
conf:
features:
pg_autoscaler: false
- cluster_flags:
- set: "noup"
pool:
spec:
# Health metrics pool
diff --git a/global/software/config/endpoints.yaml b/global/software/config/endpoints.yaml
index 1a705bf6f..d78fcec10 100644
--- a/global/software/config/endpoints.yaml
+++ b/global/software/config/endpoints.yaml
@@ -256,6 +256,10 @@ data:
podport: 10283
status:
podport: 18089
+ stream:
+ podport: 18090
+ profiler:
+ podport: 18088
kubernetesprovisioner:
name: promenade
hosts:
diff --git a/global/software/config/versions.yaml b/global/software/config/versions.yaml
index 8aad81e42..eb1bcd084 100644
--- a/global/software/config/versions.yaml
+++ b/global/software/config/versions.yaml
@@ -201,7 +201,7 @@ data:
type: git
cinder-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 3dd0eb0cdf54387447f07a4ec6be9582c457a1a8
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
glance:
@@ -211,7 +211,7 @@ data:
type: git
glance-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 3dd0eb0cdf54387447f07a4ec6be9582c457a1a8
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
heat:
@@ -221,7 +221,7 @@ data:
type: git
heat-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 3dd0eb0cdf54387447f07a4ec6be9582c457a1a8
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
helm_toolkit:
@@ -236,7 +236,7 @@ data:
type: git
horizon-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 3dd0eb0cdf54387447f07a4ec6be9582c457a1a8
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
ingress:
@@ -251,7 +251,7 @@ data:
type: git
keystone:
location: https://opendev.org/openstack/openstack-helm
- reference: 28d0a56e46129276559a4ddb2dea32c35b10b58e
+ reference: d467d685a3863edc5fed7c352961b3235a5e3a99
subpath: keystone
type: git
keystone-htk:
@@ -266,7 +266,7 @@ data:
type: git
libvirt-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 3dd0eb0cdf54387447f07a4ec6be9582c457a1a8
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
mariadb:
@@ -276,7 +276,7 @@ data:
type: git
mariadb-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: b482b57e6ea85eceef02787cb2e8eb884cceb80c
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
memcached:
@@ -296,17 +296,17 @@ data:
type: git
neutron-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 4f30b1361e2b596ce8760fd593f08d4f9a6639fe
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
nova:
location: https://opendev.org/openstack/openstack-helm
- reference: 4aa7a3026706758d22dc3e7002a2a0bffcfd84ea
+ reference: 2ec17153c6cb918dd357f71824ec59dd0d74dfba
subpath: nova
type: git
nova-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 017c8df602cbe33ae3e70a7125ee94886136e850
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
openvswitch:
@@ -316,17 +316,27 @@ data:
type: git
openvswitch-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: d0b32ed88ad652d9c2226466a13bac8b28038399
+ reference: f08d30df6b871044135534eedf76c8f2760d9923
+ subpath: helm-toolkit
+ type: git
+ placement:
+ location: https://opendev.org/openstack/openstack-helm
+ reference: 2ec17153c6cb918dd357f71824ec59dd0d74dfba
+ subpath: placement
+ type: git
+ placement-htk:
+ location: https://opendev.org/openstack/openstack-helm-infra
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
rabbitmq:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 1a8536fd5d9c3c05a0c4b5cd0e6e4a502c9c53bc
+ reference: 5c8bd68e764b22122d6be4cbda04cfdc76223b23
subpath: rabbitmq
type: git
rabbitmq-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 832718629f3d967c0bca7f28c53f57cd5ad4ddaa
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
tempest:
@@ -352,12 +362,12 @@ data:
type: git
mariadb:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: ba601e0cba1bb584fe3bce07f96f8e5b98b12889
+ reference: 6dd39da6ad7ffd744ecff423e99637aadd9c0414
subpath: mariadb
type: git
mariadb-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: a4568f31e2e9d09c8f318a9d938c9a16f0da59ef
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
mini-mirror:
@@ -403,7 +413,7 @@ data:
osh_infra:
ceph-rgw:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 20cf2db961a05285a751b3bc96b8fa4e51e3b412
+ reference: eacf93722136636dcfbd2b68c59b71f071ffc085
subpath: ceph-rgw
type: git
ceph-rgw-htk:
@@ -413,17 +423,17 @@ data:
type: git
elasticsearch:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: a2c1eea8a982de777fa430efdf188d556630f3f0
+ reference: fd4bf572111b75f1a73396c6d3b714259b53a024
subpath: elasticsearch
type: git
elasticsearch-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: a78ee39dcb9209a4ba6cc87f2989481a9fa63fc1
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
fluentd:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 59164428d305bf72dd67733a184266fd1217c153
+ reference: ddd5a74319142b14d42271da6727e76637133869
subpath: fluentd
type: git
fluentd-htk:
@@ -433,22 +443,22 @@ data:
type: git
grafana:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 128c3f748aee3ae72cccca0ff17a71ac1ed5c2fb
+ reference: 87e3a02dd558dfca6a9a8f49feb34f47d516cbf7
subpath: grafana
type: git
grafana-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: a78ee39dcb9209a4ba6cc87f2989481a9fa63fc1
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
kibana:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: b62a46336c1b6ca86e48710ba85c9320f3075fd5
+ reference: 9a719e2a18bfd4f1daa57d1a4397d89966653b18
subpath: kibana
type: git
kibana-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: a78ee39dcb9209a4ba6cc87f2989481a9fa63fc1
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
local-storage:
@@ -488,7 +498,7 @@ data:
type: git
prometheus-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: a78ee39dcb9209a4ba6cc87f2989481a9fa63fc1
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
prometheus_kube_state_metrics:
@@ -549,7 +559,7 @@ data:
type: git
armada-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 926348fe2476051f9ca825916db333f81c0139b7
+ reference: 44947cc80b91510da6f68a434c847af2d260cabd
subpath: helm-toolkit
type: git
barbican:
@@ -559,12 +569,12 @@ data:
type: git
barbican-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: c2ece6a45aea1a4d52942eeba23b5d37de70c082
+ reference: 2b20674cad133581e1259ac87470ba0f6cca313b
subpath: helm-toolkit
type: git
ceph-client:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: dd39a0f7e08c9eee861b9fa23e9587d440b76c43
+ reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e
subpath: ceph-client
type: git
ceph-htk:
@@ -574,22 +584,22 @@ data:
type: git
ceph-mon:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 4eee89ccba75a34b222d2f828129d0d5f26ffd23
+ reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e
subpath: ceph-mon
type: git
ceph-osd:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 4ed24de14b562607742a246906b48fba647d3ce8
+ reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e
subpath: ceph-osd
type: git
ceph-provisioners:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 4ed24de14b562607742a246906b48fba647d3ce8
+ reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e
subpath: ceph-provisioners
type: git
ceph-rgw:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 20cf2db961a05285a751b3bc96b8fa4e51e3b412
+ reference: 2f8ea3977ba31a4576ffb9bf98282d0586d1aa25
subpath: ceph-rgw
type: git
deckhand:
@@ -599,7 +609,7 @@ data:
type: git
deckhand-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 926348fe2476051f9ca825916db333f81c0139b7
+ reference: 8b09a074232fd1abff26055fd975ce742bc7d71b
subpath: helm-toolkit
type: git
divingbell:
@@ -619,7 +629,7 @@ data:
type: git
drydock-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 926348fe2476051f9ca825916db333f81c0139b7
+ reference: 9061d08a5e41a94fd92e60d860bfa7464d2a3cb5
subpath: helm-toolkit
type: git
ingress:
@@ -634,7 +644,7 @@ data:
type: git
keystone:
location: https://opendev.org/openstack/openstack-helm
- reference: 28d0a56e46129276559a4ddb2dea32c35b10b58e
+ reference: d467d685a3863edc5fed7c352961b3235a5e3a99
subpath: keystone
type: git
keystone-htk:
@@ -649,7 +659,7 @@ data:
type: git
maas-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: d0f808a64e2b0340aeefcfc4c6107bc825a9fc99
+ reference: d96b724310252c259041c216e1c110062e506347
subpath: helm-toolkit
type: git
mariadb:
@@ -659,7 +669,7 @@ data:
type: git
mariadb-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: f08d30df6b871044135534eedf76c8f2760d9923
+ reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db
subpath: helm-toolkit
type: git
memcached:
@@ -679,12 +689,12 @@ data:
type: git
postgresql-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 4a770bb90846e7bd5fd32be4fcbce95b4218be01
+ reference: 25aa3690252c605d237c187524d0adf73a8424e5
subpath: helm-toolkit
type: git
promenade:
location: https://opendev.org/airship/promenade
- reference: 27f181a9d30294030d695b747b2e4560ffbd29be
+ reference: d161528ae8de0dcb0dd9d39bc370f85f2aa1c462
subpath: charts/promenade
type: git
promenade-htk:
@@ -709,12 +719,12 @@ data:
type: git
shipyard-htk:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 926348fe2476051f9ca825916db333f81c0139b7
+ reference: b50fae62a4ad0992ce877cd632800e1eed5f71a9
subpath: helm-toolkit
type: git
tenant-ceph-client:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: dd39a0f7e08c9eee861b9fa23e9587d440b76c43
+ reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e
subpath: ceph-client
type: git
tenant-ceph-htk:
@@ -724,22 +734,22 @@ data:
type: git
tenant-ceph-mon:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 4eee89ccba75a34b222d2f828129d0d5f26ffd23
+ reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e
subpath: ceph-mon
type: git
tenant-ceph-osd:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 4ed24de14b562607742a246906b48fba647d3ce8
+ reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e
subpath: ceph-osd
type: git
tenant-ceph-provisioners:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 4ed24de14b562607742a246906b48fba647d3ce8
+ reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e
subpath: ceph-provisioners
type: git
tenant-ceph-rgw:
location: https://opendev.org/openstack/openstack-helm-infra
- reference: 20cf2db961a05285a751b3bc96b8fa4e51e3b412
+ reference: 2f8ea3977ba31a4576ffb9bf98282d0586d1aa25
subpath: ceph-rgw
type: git
tiller:
@@ -832,11 +842,12 @@ data:
busybox: &busybox docker.io/busybox:1.28.3
alpine-38: &alpine-38 docker.io/alpine:3.8
airflow: &airflow quay.io/airshipit/airflow:f0f876afef07f62cd38fbce8b775cfc741e0bf52-ubuntu_xenial
- armada: &armada quay.io/airshipit/armada:7ef4b8643b5ec5216a8f6726841e156c0aa54a1a-ubuntu_bionic
+ #armada: &armada quay.io/airshipit/armada:7ef4b8643b5ec5216a8f6726841e156c0aa54a1a-ubuntu_bionic
+ armada: &armada quay.io/airshipit/armada:b37417253f99f23549e09502e3bcd81d450bb4c4-ubuntu_bionic
barbican: &barbican docker.io/openstackhelm/barbican@sha256:4c44bb9e5d29224007b2ef52c1ce4ff756e655efe9c6e9a95b2e98f4f501499e
#ceph_daemon: &ceph_daemon docker.io/openstackhelm/ceph-daemon:ubuntu_bionic-20191216
- ceph_daemon: &ceph_daemon docker.io/openstackhelm/ceph-daemon:ubuntu_bionic-20210902
+ ceph_daemon: &ceph_daemon docker.io/openstackhelm/ceph-daemon:ubuntu_bionic-20200521
ceph-utility: &ceph-utility quay.io/airshipit/porthole-ceph-utility:e7a6644b3af8bddd94d20ca35f388ae605203416-ubuntu_bionic
@@ -855,15 +866,15 @@ data:
curator: &curator docker.io/bobrik/curator:5.8.1
- deckhand: &deckhand quay.io/airshipit/deckhand:90f653bc0fa9f2c910d05a3c00d2c339c064638d-ubuntu_xenial
+ deckhand: &deckhand quay.io/airshipit/deckhand:5cd799cc5d04527ac782270008ff647b3779ff05-ubuntu_bionic
- dep_check: &dep_check quay.io/stackanetes/kubernetes-entrypoint:v0.3.1
+ dep_check: &dep_check quay.io/airshipit/kubernetes-entrypoint:v1.0.0
- drydock: &drydock quay.io/airshipit/drydock:dfe7c0508d27f517bf29cd2f37b7f07b112edb4e
+ drydock: &drydock quay.io/airshipit/drydock:aa0cf8c8d09ad37b8ebcce677064e1b3b2211758-ubuntu_bionic
elasticsearch: &elasticsearch docker.io/openstackhelm/elasticsearch-s3:7_1_0-20191119
- etcd: &etcd quay.io/coreos/etcd:v3.4.8
+ etcd: &etcd quay.io/coreos/etcd:v3.4.15
etcdctl: &etcdctl-utility quay.io/airshipit/porthole-etcdctl-utility:e7a6644b3af8bddd94d20ca35f388ae605203416-ubuntu_bionic
@@ -889,35 +900,34 @@ data:
ingress_error_pages_404: &ingress_error_pages_404 gcr.io/google-containers/ingress-gce-404-server-with-metrics-amd64:v1.6.0@sha256:d83d8a481145d0eb71f8bd71ae236d1c6a931dd3bdcaf80919a8ec4a4d8aff74
- ingress_controller_mariadb: &ingress_controller_mariadb quay.io/kubernetes-ingress-controller/nginx-ingress-controller:0.32.0
+ ingress_controller_mariadb: &ingress_controller_mariadb k8s.gcr.io/ingress-nginx/controller:v0.48.1
k8s-keystone-auth: &k8s-keystone-auth docker.io/k8scloudprovider/k8s-keystone-auth:v1.18.0
- kibana: &kibana docker.elastic.co/kibana/kibana-oss:7.9.2
+ kibana: &kibana docker.elastic.co/kibana/kibana-oss:7.1.0
libvirt: &libvirt docker.io/openstackhelm/libvirt:ubuntu_bionic-20210227
- mariadb_db: &mariadb_db docker.io/openstackhelm/mariadb:10.2.18
+ mariadb_db: &mariadb_db docker.io/openstackhelm/mariadb:ubuntu_xenial-20200811
- maas_rack_controller: &maas_rack_controller quay.io/airshipit/maas-rack-controller:840b482373df163ba088b91c278f2a58fd599b7b
+ maas_rack_controller: &maas_rack_controller quay.io/airshipit/maas-rack-controller:94e55069dc17606e0c3b585d7e901ee0bf372f29
- maas_region_controller: &maas_region_controller quay.io/airshipit/maas-region-controller:840b482373df163ba088b91c278f2a58fd599b7b
+ maas_region_controller: &maas_region_controller quay.io/airshipit/maas-region-controller:94e55069dc17606e0c3b585d7e901ee0bf372f29
maas_ingress: &maas_ingress docker-prod-local.artifactory.mirantis.com/mirantis/kubernetes-ingress-nginx/nginx-ingress-controller-amd64@sha256:fe510f97b02566e21685b7b108422370ca67a8a44099ce7e968a778c0ba06e0b
memcached: &memcached docker.io/library/memcached:1.6.6-alpine
#mos_cinder: &mos_cinder openstackhelm/cinder:stein-ubuntu_bionic-20200513
mos_cinder: &mos_cinder docker.io/openstackhelm/cinder:train-ubuntu_bionic-20200612
- mos_cinder_storage_init: &mos_cinder_storage_init docker.io/openstackhelm/ceph-config-helper:ubuntu_bionic-20200416
+ mos_cinder_storage_init: &mos_cinder_storage_init docker.io/openstackhelm/ceph-config-helper:ubuntu_bionic-20220603
#mos_glance: &mos_glance openstackhelm/glance:stein-ubuntu_bionic-20200513
mos_glance: &mos_glance docker.io/openstackhelm/glance:train-ubuntu_bionic-20200612
- #mos_heat: &mos_heat docker.io/deepakdt/heat:stein-ubuntu_bionic-taas
- mos_heat: &mos_heat docker.io/openstackhelm/heat:train-ubuntu_bionic-20200612
+ mos_heat: &mos_heat docker.io/openstackhelm/heat:stein-ubuntu_bionic
mos_heat_nova: &mos_heat_nova docker.io/openstackhelm/heat:train-ubuntu_bionic-20200612
- mos_horizon: &mos_horizon docker.io/openstackhelm/horizon:train-ubuntu_bionic-20200612
+ mos_horizon: &mos_horizon docker.io/openstackhelm/horizon:train-ubuntu_bionic
mos_keystone: &mos_keystone docker.io/openstackhelm/keystone:train-ubuntu_bionic-20200612
#mos_neutron: &mos_neutron docker.io/imarijitbose/stein_neutron_bionic
@@ -933,22 +943,25 @@ data:
nova_spiceproxy: &nova_spiceproxy docker.io/openstackhelm/nova:train-ubuntu_bionic-20200612
#openvswitch: &openvswitch docker.io/deepakdt/openvswitch:ovs2.11.1-dpdk18.11.3-ubuntu_bionic-dpdk
- openvswitch: &openvswitch docker.io/openstackhelm/openvswitch:ubuntu_bionic-20200722
+ openvswitch: &openvswitch docker.io/openstackhelm/openvswitch:ubuntu_bionic-dpdk-20220725
openstack-utility: &openstack-utility quay.io/airshipit/porthole-openstack-utility:e7a6644b3af8bddd94d20ca35f388ae605203416-ubuntu_bionic
pegleg: &pegleg quay.io/airshipit/pegleg@sha256:0ca3b708c37425e4e05627443dbd39d2ed27cf06193d2cc3bcb5b985b260d79d
+
+ mos_placement: &mos_placement docker.io/openstackhelm/placement:periodic_train-ubuntu_bionic-20220309
+
nc-swissknife: &nc-swissknife quay.io/airshipit/pegleg@sha256:0ca3b708c37425e4e05627443dbd39d2ed27cf06193d2cc3bcb5b985b260d79d
patroni: &patroni docker-prod-local.artifactory.mirantis.com/nc/patroni:9.6.15-bionic-1567439806207
- postgres: &postgres docker-prod-local.artifactory.mirantis.com/nc/postgresql:9.6.15-debian-1566552796302
+ postgres: &postgres docker.io/postgres:9.6
promenade: &promenade quay.io/airshipit/promenade:b65930f205b77f28507dee9296aead00e24f2a18
divingbell: &divingbell docker.io/ubuntu:16.04
prometheus: &prometheus docker.io/prom/prometheus:v2.12.0
- prometheus_elasticsearch_exporter: &prometheus_elasticsearch_exporter docker.io/justwatch/elasticsearch_exporter:1.0.1
+ prometheus_elasticsearch_exporter: &prometheus_elasticsearch_exporter docker.io/justwatch/elasticsearch_exporter:1.1.0
prometheus_fluentd_exporter: &prometheus_fluentd_exporter docker.io/bitnami/fluentd-exporter:0.2.0
prometheus_memcached_exporter: &prometheus_memcached_exporter docker.io/prom/memcached-exporter:v0.4.1
prometheus_mysql_exporter: &prometheus_mysql_exporter docker.io/prom/mysqld-exporter:v0.10.0
@@ -958,12 +971,12 @@ data:
rabbitmq_mgmt: &rabbitmq_mgmt docker.io/library/rabbitmq:3.7.15-management
rabbitmq: &rabbitmq docker.io/library/rabbitmq:3.7.15
rabbitmq_exporter: &rabbitmq_exporter docker.io/kbudde/rabbitmq-exporter:v1.0.0-RC7.1
- rally_test: &rally_test docker.io/xrally/xrally-openstack:1.3.0
+ rally_test: &rally_test docker.io/xrally/xrally-openstack:2.0.0
#rbd_provisioner: &rbd_provisioner docker.io/openstackhelm/ceph-rbd-provisioner:ubuntu_bionic-20191216
rbd_provisioner: &rbd_provisioner docker.io/openstackhelm/ceph-rbd-provisioner:ubuntu_bionic-20200521
selenium_tests: &selenium_tests docker.io/openstackhelm/osh-selenium:ubuntu_bionic-20191017
shipyard: &shipyard quay.io/airshipit/shipyard:0b29f89d3fc284fe483c58f102574c687034468d-ubuntu_xenial
- sstream_cache: &sstream_cache quay.io/airshipit/sstream-cache:03ebbaaca3f38ab49a5993b506761a4abfd19d89
+ sstream_cache: &sstream_cache quay.io/airshipit/sstream-cache:3accf71685ed980ed8c5c07fd8c59306c012dcd2
#storage_init: &storage_init docker.io/openstackhelm/ceph-config-helper:ubuntu_bionic-20191216
storage_init: &storage_init docker.io/openstackhelm/ceph-config-helper:ubuntu_bionic-20200521
@@ -985,7 +998,7 @@ data:
kubernetes_test: &kubernetes_test docker.io/python:3.6
kubernetes_pause: &kubernetes_pause gcr.io/google_containers/pause-amd64:3.1
- grafana: &grafana docker.io/grafana/grafana:6.2.0
+ grafana: &grafana docker.io/grafana/grafana:7.3.6
# TODO: Move this under the images_refs.images header for consistency
keystone: &ref_keystone
@@ -1309,6 +1322,15 @@ data:
openvswitch_db_server: *openvswitch
openvswitch_vswitchd: *openvswitch
dep_check: *dep_check
+ placement:
+ bootstrap: *mos_heat
+ <<: *ref_keystone
+ db_migrate: *mos_placement
+ db_drop: *mos_heat
+ db_init: *mos_heat
+ dep_check: *dep_check
+ placement: *mos_placement
+ placement_db_sync: *mos_placement
rabbitmq:
prometheus_rabbitmq_exporter: *rabbitmq_exporter
prometheus_rabbitmq_exporter_helm_tests: *mos_heat
@@ -1722,7 +1744,7 @@ data:
- main
gpgkey: ""
named:
- runtime: containerd=1.5.2-0ubuntu1~18.04.2
+ runtime: containerd=1.5.5-0ubuntu3~18.04.2
socat: socat
unnamed:
- bsd-mailx
@@ -1744,5 +1766,6 @@ data:
# NC release to reboot the nodes after the completion of the Shipyard site-update. In
# the MOP update, you should also link to the following wiki page:
# https://wiki.web.att.com/display/CCPdev/i40e+Driver+upgrades
- location: https://netactuate.dl.sourceforge.net/project/e1000/i40e%20stable/2.12.6/i40e-2.12.6.tar.gz
+ #location: https://netactuate.dl.sourceforge.net/project/e1000/i40e%20stable/2.12.6/i40e-2.12.6.tar.gz
+ location: https://sourceforge.net/projects/e1000/files/unsupported/i40e%20unsupported/i40e-2.12.6.3/i40e-2.12.6.3.tar.gz
...
diff --git a/type/cruiser/software/charts/ucp/core/scaled-charts.yaml b/type/cruiser/software/charts/ucp/core/scaled-charts.yaml
index c565de28f..22682b271 100644
--- a/type/cruiser/software/charts/ucp/core/scaled-charts.yaml
+++ b/type/cruiser/software/charts/ucp/core/scaled-charts.yaml
@@ -87,5 +87,5 @@ data:
values:
pod:
replicas:
- server: 3
+ server: 1
...
diff --git a/type/cruiser/software/config/endpoints.yaml b/type/cruiser/software/config/endpoints.yaml
index d64144f48..18bc2a1b5 100644
--- a/type/cruiser/software/config/endpoints.yaml
+++ b/type/cruiser/software/config/endpoints.yaml
@@ -285,6 +285,7 @@ data:
default: 8088
public: 443
oslo_db:
+ namespace: openstack
hosts:
default: mariadb
discovery: mariadb-discovery
diff --git a/type/cruiser/software/config/service_accounts.yaml b/type/cruiser/software/config/service_accounts.yaml
index f704e82c7..7dce22c39 100644
--- a/type/cruiser/software/config/service_accounts.yaml
+++ b/type/cruiser/software/config/service_accounts.yaml
@@ -32,6 +32,8 @@ metadata:
- path: .osh.nova.nova.region_name
- path: .osh.nova.test.region_name
- path: .osh.nova.placement.region_name
+ - path: .osh.placement.placement.region_name
+ - path: .osh.placement.test.region_name
- path: .osh.barbican.barbican.region_name
- path: .osh.horizon.admin.region_name
data:
@@ -159,6 +161,25 @@ data:
oslo_messaging:
neutron:
username: neutron-rabbitmq-user
+ placement:
+ placement:
+ role: admin
+ username: placement
+ project_name: service
+ user_domain_name: default
+ project_domain_name: default
+ test:
+ role: admin
+ username: placement-test
+ project_name: test
+ user_domain_name: service
+ project_domain_name: service
+ oslo_db:
+ username: placement
+ database: placement
+ oslo_messaging:
+ placement:
+ username: placement-rabbitmq-user
nova:
nova:
role: admin
@@ -190,6 +211,8 @@ data:
oslo_messaging:
nova:
username: nova-rabbitmq-user
+ placement:
+ username: nova-rabbitmq-user
horizon:
admin:
username: admin