diff --git a/doc/source/conf.py b/doc/source/conf.py index a30be6875..cb4d2f6cd 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -68,7 +68,7 @@ release = u'0.1.0' # # This is also used if you do content translation via gettext catalogs. # Usually you set "language" from the command line for these cases. -language = None +language = 'en' # List of patterns, relative to source directory, that match files and # directories to ignore when looking for source files. diff --git a/global/schemas/pegleg/AccountCatalogue/v1.yaml b/global/schemas/pegleg/AccountCatalogue/v1.yaml index 681aed425..b7dacafc8 100644 --- a/global/schemas/pegleg/AccountCatalogue/v1.yaml +++ b/global/schemas/pegleg/AccountCatalogue/v1.yaml @@ -631,6 +631,11 @@ data: properties: username: type: string + placement: + type: object + properties: + username: + type: string oslo_db: type: object properties: @@ -652,6 +657,44 @@ data: type: string database: type: string + placement: + type: object + properties: + placement: + type: object + properties: + role: + type: string + region_name: + type: string + username: + type: string + project_name: + type: string + user_domain_name: + type: string + project_domain_name: + type: string + oslo_messaging: + type: object + properties: + admin: + type: object + properties: + username: + type: string + placement: + type: object + properties: + username: + type: string + oslo_db: + type: object + properties: + username: + type: string + database: + type: string horizon: type: object properties: diff --git a/global/software/charts/osh-infra/osh-infra-dashboards/grafana.yaml b/global/software/charts/osh-infra/osh-infra-dashboards/grafana.yaml index 3961986ad..2c2dce691 100644 --- a/global/software/charts/osh-infra/osh-infra-dashboards/grafana.yaml +++ b/global/software/charts/osh-infra/osh-infra-dashboards/grafana.yaml @@ -305,17454 +305,40363 @@ data: group_dn = "*" org_role = "Viewer" dashboards: - calico: - __inputs: - - name: prometheus - label: 
Prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 5.0.0 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - annotations: - list: - - builtIn: 1 - datasource: "-- Grafana --" - enable: true - hide: true - iconColor: rgba(0, 211, 255, 1) - name: Annotations & Alerts - type: dashboard - description: Calico cluster monitoring dashboard - editable: false - gnetId: 3244 - graphTooltip: 0 - id: - links: [] - panels: - - collapsed: false - gridPos: - h: 1 - w: 24 - x: 0 - 'y': 0 - id: 15 - panels: [] - repeat: - title: Felix - type: row - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 1 - id: 1 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_active_local_endpoints - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Active Local Endpoints - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 1 - id: 3 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - 
total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_active_local_policies - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Active Local Policies - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 8 - id: 2 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_active_local_selectors - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Active Local Selectors - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 8 - id: 4 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true 
- total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_active_local_tags - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Active Local Tags - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 15 - id: 5 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_cluster_num_host_endpoints - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Cluster Host Endpoints - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 15 - id: 6 - legend: - alignAsTable: true - avg: false - current: true - max: true - min: true - show: true 
- total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_cluster_num_workload_endpoints - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Cluster Workload Endpoints - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 22 - id: 7 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_cluster_num_hosts - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Clusters Hosts - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 22 - id: 8 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: 
true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_ipsets_calico - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Active IP Sets - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 29 - id: 9 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_iptables_chains - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Active IP Tables Chains - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 29 - id: 10 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: 
false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_ipset_errors - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: IP Set Command Failures - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 36 - id: 11 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_iptables_save_errors - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: IP Tables Save Errors - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 36 - id: 12 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: 
false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_iptables_restore_errors - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: IP Tables Restore Errors - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 0 - 'y': 43 - id: 13 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_resyncs_started - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Felix Resyncing Datastore - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - gridPos: - h: 7 - w: 12 - x: 12 - 'y': 43 - id: 14 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - 
total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - expr: felix_int_dataplane_failures - format: time_series - intervalFactor: 2 - legendFormat: "{{instance}}" - refId: A - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Dataplane failed updates - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - refresh: 5m - schemaVersion: 16 - style: dark - tags: - - calico - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - time: - from: now-1h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: utc - title: Kubernetes Calico - version: 2 - ceph_cluster: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: Prometheus.IO - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: panel - id: singlestat - name: Singlestat - version: '' - - type: panel - id: graph - name: Graph - version: '' - - type: grafana - id: grafana - name: Grafana - version: 3.1.1 - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - id: - title: Ceph - Cluster - tags: - - ceph - - cluster - style: dark - timezone: browser - editable: true - hideControls: false - sharedCrosshair: false - rows: - - collapse: false - editable: true - height: 150px - panels: - - cacheTimeout: - 
colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 21 - interval: 1m - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: ceph_health_status{application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - refId: A - step: 60 - thresholds: '1,1' - title: Status - transparent: false - type: singlestat - valueFontSize: 100% - valueMaps: - - op: "=" - text: N/A - value: 'null' - - op: "=" - text: HEALTHY - value: '0' - - op: "=" - text: WARNING - value: '1' - - op: "=" - text: CRITICAL - value: '2' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 22 - interval: 1m - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: 
rgb(31, 120, 193) - show: true - targets: - - expr: count(ceph_pool_max_avail{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '' - title: Pools - transparent: false - type: singlestat - valueFontSize: 100% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: bytes - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 33 - interval: 1m - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - targets: - - expr: ceph_cluster_total_bytes{application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: 0.025,0.1 - title: Cluster Capacity - transparent: false - type: singlestat - valueFontSize: 100% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: bytes - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 34 - interval: 1m - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - 
value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - targets: - - expr: ceph_cluster_total_used_bytes{application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: 0.025,0.1 - title: Used Capacity - transparent: false - type: singlestat - valueFontSize: 100% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percentunit - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 23 - interval: 1m - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: ceph_cluster_total_used_bytes/ceph_cluster_total_bytes{application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '70,80' - title: Current Utilization - transparent: false - type: singlestat - valueFontSize: 100% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - title: New row - - collapse: false - editable: true - height: 100px - panels: 
- - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 26 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum(ceph_osd_in{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '' - title: OSDs IN - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 40, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 27 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: 
sum(ceph_osd_metadata{application="ceph",release_group="$ceph_cluster"}) - sum(ceph_osd_in{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '1,1' - title: OSDs OUT - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 28 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum(ceph_osd_up{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '' - title: OSDs UP - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 40, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 29 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - 
maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum(ceph_osd_metadata{application="ceph",release_group="$ceph_cluster"}) - sum(ceph_osd_up{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '1,1' - title: OSDs DOWN - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 30 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - targets: - - expr: avg(ceph_osd_numpg{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '250,300' - title: Average PGs per OSD - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - title: New row - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: - Available: "#EAB839" - Total Capacity: "#447EBC" - Used: 
"#BF1B00" - total_avail: "#6ED0E0" - total_space: "#7EB26D" - total_used: "#890F02" - bars: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 4 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '300' - id: 1 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 0 - links: [] - minSpan: - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: Total Capacity - fill: 0 - linewidth: 3 - stack: false - span: 4 - stack: true - steppedLine: false - targets: - - expr: ceph_cluster_total_bytes{application="ceph",release_group="$ceph_cluster"} - ceph_cluster_total_used_bytes{application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Available - refId: A - step: 60 - - expr: ceph_cluster_total_used_bytes - interval: "$interval" - intervalFactor: 1 - legendFormat: Used - refId: B - step: 60 - - expr: ceph_cluster_total_bytes - interval: "$interval" - intervalFactor: 1 - legendFormat: Total Capacity - refId: C - step: 60 - timeFrom: - timeShift: - title: Capacity - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Total Capacity: "#7EB26D" - Used: "#BF1B00" - total_avail: "#6ED0E0" - total_space: "#7EB26D" - total_used: "#890F02" - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - thresholdLine: false - height: 
'300' - id: 3 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - minSpan: - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: true - steppedLine: false - targets: - - expr: sum(ceph_osd_op_w{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Write - refId: A - step: 60 - - expr: sum(ceph_osd_op_r{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Read - refId: B - step: 60 - timeFrom: - timeShift: - title: IOPS - tooltip: - msResolution: true - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: none - label: '' - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '300' - id: 7 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: true - steppedLine: false - targets: - - expr: sum(ceph_osd_op_in_bytes{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Write - refId: A - step: 60 - - expr: sum(ceph_osd_op_out_bytes{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - 
legendFormat: Read - refId: B - step: 60 - timeFrom: - timeShift: - title: Throughput - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: Bps - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - repeat: - showTitle: true - title: CLUSTER - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 18 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/^Total.*$/" - stack: false - span: 12 - stack: true - steppedLine: false - targets: - - expr: ceph_cluster_total_objects{application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Total - refId: A - step: 60 - timeFrom: - timeShift: - title: Objects in the Cluster - tooltip: - msResolution: false - shared: true - sort: 1 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 19 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - total: false - 
values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/^Total.*$/" - stack: false - span: 6 - stack: true - steppedLine: false - targets: - - expr: sum(ceph_osd_numpg{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Total - refId: A - step: 60 - - expr: sum(ceph_pg_active{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Active - refId: B - step: 60 - - expr: sum(ceph_pg_inconsistent{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Inconsistent - refId: C - step: 60 - - expr: sum(ceph_pg_creating{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Creating - refId: D - step: 60 - - expr: sum(ceph_pg_recovering{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Recovering - refId: E - step: 60 - - expr: sum(ceph_pg_down{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Down - refId: F - step: 60 - timeFrom: - timeShift: - title: PGs - tooltip: - msResolution: false - shared: true - sort: 1 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 20 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - total: false - values: 
true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/^Total.*$/" - stack: false - span: 6 - stack: true - steppedLine: false - targets: - - expr: sum(ceph_pg_degraded{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Degraded - refId: A - step: 60 - - expr: sum(ceph_pg_stale{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Stale - refId: B - step: 60 - - expr: sum(ceph_pg_undersized{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Undersized - refId: C - step: 60 - timeFrom: - timeShift: - title: Stuck PGs - tooltip: - msResolution: false - shared: true - sort: 1 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - title: New row - time: - from: now-1h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - current: {} - hide: 0 - label: Cluster - name: ceph_cluster - options: [] - type: query - query: label_values(ceph_health_status, release_group) - refresh: 1 - sort: 2 - datasource: "${DS_PROMETHEUS}" - - auto: true - auto_count: 10 - auto_min: 1m - current: - tags: [] - text: 1m - value: 1m - datasource: - hide: 0 - includeAll: false - label: Interval - multi: false - name: interval - options: - - selected: false - text: auto - value: 
"$__auto_interval" - - selected: true - text: 1m - value: 1m - - selected: false - text: 10m - value: 10m - - selected: false - text: 30m - value: 30m - - selected: false - text: 1h - value: 1h - - selected: false - text: 6h - value: 6h - - selected: false - text: 12h - value: 12h - - selected: false - text: 1d - value: 1d - - selected: false - text: 7d - value: 7d - - selected: false - text: 14d - value: 14d - - selected: false - text: 30d - value: 30d - query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d - refresh: 0 - type: interval - annotations: - list: [] - refresh: 5m - schemaVersion: 12 - version: 26 - links: [] - gnetId: 917 - description: "Ceph Cluster overview.\r\n" - ceph_osd: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: Prometheus.IO - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: panel - id: singlestat - name: Singlestat - version: '' - - type: panel - id: graph - name: Graph - version: '' - - type: grafana - id: grafana - name: Grafana - version: 3.1.1 - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - id: - title: Ceph - OSD - tags: - - ceph - - osd - style: dark - timezone: browser - editable: true - hideControls: false - sharedCrosshair: false - rows: - - collapse: false - editable: true - height: 100px - panels: - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 40, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 6 - interval: - isNew: true - links: [] - mappingType: 2 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - 
to: 'null' - - from: '0' - text: DOWN - to: '0.99' - - from: '0.99' - text: UP - to: '1' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: ceph_osd_up{ceph_daemon="$osd",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - refId: A - step: 60 - thresholds: '0,1' - timeFrom: - title: Status - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: DOWN - value: '0' - - op: "=" - text: UP - value: '1' - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 40, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 8 - interval: - isNew: true - links: [] - mappingType: 2 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - - from: '0' - text: OUT - to: '0.99' - - from: '0.99' - text: IN - to: '1' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: ceph_osd_in{ceph_daemon="$osd",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - refId: A - step: 60 - thresholds: '0,1' - timeFrom: - title: Available - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: DOWN - value: '0' - - op: "=" - text: UP - value: '1' - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - 
colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 10 - interval: - isNew: true - links: [] - mappingType: 2 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: count(ceph_osd_metadata{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - refId: A - step: 60 - thresholds: '0,1' - timeFrom: - title: Total OSDs - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: DOWN - value: '0' - - op: "=" - text: UP - value: '1' - - op: "=" - text: N/A - value: 'null' - valueName: current - title: New row - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: 250 - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: 300 - threshold2Color: rgba(234, 112, 112, 0.22) - thresholdLine: true - id: 5 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/^Average.*/" - fill: 0 - stack: false - span: 10 - stack: true - steppedLine: false - targets: - - expr: 
ceph_osd_numpg{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Number of PGs - {{ $osd }} - refId: A - step: 60 - - expr: avg(ceph_osd_numpg{application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Average Number of PGs in the Cluster - refId: B - step: 60 - timeFrom: - timeShift: - title: PGs - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 7 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: true - targets: - - expr: (ceph_osd_stat_bytes_used{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"}/ceph_osd_stat_bytes{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"})*100 - interval: "$interval" - intervalFactor: 1 - legendFormat: '' - refId: A - step: 60 - thresholds: '60,80' - timeFrom: - title: Utilization - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - showTitle: true - 
title: 'OSD: $osd' - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 2 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: true - steppedLine: false - targets: - - expr: ceph_osd_stat_bytes_used{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Used - {{ osd.$osd }} - metric: ceph_osd_used_bytes - refId: A - step: 60 - - expr: ceph_osd_stat_bytes{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"} - ceph_osd_stat_bytes_used{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"} - hide: false - interval: "$interval" - intervalFactor: 1 - legendFormat: Available - {{ $osd }} - metric: ceph_osd_avail_bytes - refId: B - step: 60 - timeFrom: - timeShift: - title: OSD Storage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 5 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 9 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - 
show: true - total: false - values: true - lines: false - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 2 - points: true - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: (ceph_osd_stat_bytes_used{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"}/ceph_osd_stat_bytes{ceph_daemon=~"$osd",application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - legendFormat: Available - {{ $osd }} - metric: ceph_osd_avail_bytes - refId: A - step: 60 - timeFrom: - timeShift: - title: Utilization Variance - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: none - label: - logBase: 1 - max: - min: - show: true - - format: none - label: - logBase: 1 - max: - min: - show: true - time: - from: now-1h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - current: {} - hide: 0 - label: Cluster - name: ceph_cluster - options: [] - type: query - query: label_values(ceph_health_status, release_group) - refresh: 1 - sort: 2 - datasource: "${DS_PROMETHEUS}" - - auto: true - auto_count: 10 - auto_min: 1m - current: - selected: true - text: 1m - value: 1m - datasource: - hide: 0 - includeAll: false - label: Interval - multi: false - name: interval - options: - - selected: false - text: auto - value: "$__auto_interval" - - selected: true - text: 1m - value: 1m - - selected: false - text: 10m - value: 10m - - selected: false - text: 30m - value: 30m - - selected: false - text: 1h - value: 1h - - 
selected: false - text: 6h - value: 6h - - selected: false - text: 12h - value: 12h - - selected: false - text: 1d - value: 1d - - selected: false - text: 7d - value: 7d - - selected: false - text: 14d - value: 14d - - selected: false - text: 30d - value: 30d - query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d - refresh: 0 - type: interval - - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: OSD - multi: false - name: osd - options: [] - query: label_values(ceph_osd_metadata{release_group="$ceph_cluster"}, ceph_daemon) - refresh: 1 - regex: '' - type: query - annotations: - list: [] - refresh: 15m - schemaVersion: 12 - version: 18 - links: [] - gnetId: 923 - description: CEPH OSD Status. - ceph_pool: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: Prometheus.IO - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: panel - id: graph - name: Graph - version: '' - - type: panel - id: singlestat - name: Singlestat - version: '' - - type: grafana - id: grafana - name: Grafana - version: 3.1.1 - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - id: - title: Ceph - Pools - tags: - - ceph - - pools - style: dark - timezone: browser - editable: true - hideControls: false - sharedCrosshair: false - rows: - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 4 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '' - id: 2 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - rightSide: true - show: true - total: false - values: true - lines: true - linewidth: 0 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - 
alias: "/^Total.*$/" - fill: 0 - linewidth: 4 - stack: false - - alias: "/^Raw.*$/" - color: "#BF1B00" - fill: 0 - linewidth: 4 - span: 10 - stack: true - steppedLine: false - targets: - - expr: ceph_pool_max_avail{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Total - {{ $pool }} - refId: A - step: 60 - - expr: ceph_pool_bytes_used{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Used - {{ $pool }} - refId: B - step: 60 - - expr: ceph_pool_max_avail{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - ceph_pool_bytes_used{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Available - {{ $pool }} - refId: C - step: 60 - - expr: ceph_pool_raw_bytes_used{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Raw - {{ $pool }} - refId: D - step: 60 - timeFrom: - timeShift: - title: "[[pool_name]] Pool Storage" - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: percentunit - gauge: - maxValue: 1 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 10 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - 
postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: (ceph_pool_bytes_used{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} / ceph_pool_max_avail{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}) - interval: "$interval" - intervalFactor: 1 - refId: A - step: 60 - thresholds: '' - title: "[[pool_name]] Pool Usage" - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - showTitle: true - title: 'Pool: $pool' - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '' - id: 7 - isNew: true - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: ceph_pool_objects{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Objects - {{ $pool_name }} - refId: A - step: 60 - - expr: ceph_pool_dirty{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"} - interval: "$interval" - intervalFactor: 1 - legendFormat: Dirty Objects - {{ $pool_name }} - refId: B - step: 60 - timeFrom: - timeShift: - title: Objects in Pool [[pool_name]] - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: short - label: - 
logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - thresholdLine: false - id: 4 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: true - steppedLine: false - targets: - - expr: irate(ceph_pool_rd{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}[3m]) - interval: "$interval" - intervalFactor: 1 - legendFormat: Read - {{ $pool_name }} - refId: B - step: 60 - - expr: irate(ceph_pool_wr{pool_id=~"$pool",application="ceph",release_group="$ceph_cluster"}[3m]) - interval: "$interval" - intervalFactor: 1 - legendFormat: Write - {{ $pool_name }} - refId: A - step: 60 - timeFrom: - timeShift: - title: "[[pool_name]] Pool IOPS" - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: none - label: IOPS - logBase: 1 - max: - min: 0 - show: true - - format: short - label: IOPS - logBase: 1 - max: - min: 0 - show: false - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 5 - interval: "$interval" - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: 
connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: true - steppedLine: false - targets: - - expr: irate(ceph_pool_rd_bytes{pool_id="$pool",application="ceph",release_group="$ceph_cluster"}[3m]) - interval: "$interval" - intervalFactor: 1 - legendFormat: Read Bytes - {{ $pool_name }} - refId: A - step: 60 - - expr: irate(ceph_pool_wr_bytes{pool_id="$pool",application="ceph",release_group="$ceph_cluster"}[3m]) - interval: "$interval" - intervalFactor: 1 - legendFormat: Written Bytes - {{ $pool_name }} - refId: B - step: 60 - timeFrom: - timeShift: - title: "[[pool_name]] Pool Throughput" - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - show: true - yaxes: - - format: Bps - label: - logBase: 1 - max: - min: 0 - show: true - - format: Bps - label: - logBase: 1 - max: - min: 0 - show: true - title: New row - time: - from: now-3h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - current: {} - hide: 0 - label: Cluster - name: ceph_cluster - options: [] - type: query - query: label_values(ceph_health_status, release_group) - refresh: 1 - sort: 2 - datasource: "${DS_PROMETHEUS}" - - auto: true - auto_count: 10 - auto_min: 1m - current: - selected: true - text: 1m - value: 1m - datasource: - hide: 0 - includeAll: false - label: Interval - multi: false - name: interval - options: - - selected: false - text: auto - value: "$__auto_interval" - - selected: true - text: 1m - value: 1m - - selected: false - text: 10m - value: 10m - - selected: false - text: 30m - value: 30m - - selected: 
false - text: 1h - value: 1h - - selected: false - text: 6h - value: 6h - - selected: false - text: 12h - value: 12h - - selected: false - text: 1d - value: 1d - - selected: false - text: 7d - value: 7d - - selected: false - text: 14d - value: 14d - - selected: false - text: 30d - value: 30d - query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d - refresh: 0 - type: interval - - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: Pool - multi: false - name: pool - options: [] - query: label_values(ceph_pool_objects{release_group="$ceph_cluster"}, pool_id) - refresh: 1 - regex: '' - type: query - - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: Pool - multi: false - name: pool_name - options: [] - query: label_values(ceph_pool_metadata{release_group="$ceph_cluster",pool_id="[[pool]]" }, name) - refresh: 1 - regex: '' - type: query - annotations: - list: [] - refresh: 5m - schemaVersion: 12 - version: 22 - links: [] - gnetId: 926 - description: Ceph Pools dashboard. - containers: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: panel - id: graph - name: Graph - version: '' - - type: panel - id: singlestat - name: Singlestat - version: '' - - type: grafana - id: grafana - name: Grafana - version: 3.1.1 - - type: datasource - id: prometheus - name: Prometheus - version: 1.3.0 - id: - title: Container Metrics (cAdvisor) - description: Monitors Kubernetes cluster using Prometheus. Shows overall cluster CPU - / Memory / Filesystem usage as well as individual pod, containers, systemd services - statistics. Uses cAdvisor metrics only. 
- tags: - - kubernetes - style: dark - timezone: browser - editable: true - hideControls: false - sharedCrosshair: false - rows: - - collapse: false - editable: true - height: 200px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - thresholdLine: false - height: 200px - id: 32 - isNew: true - legend: - alignAsTable: false - avg: true - current: true - max: false - min: false - rightSide: false - show: false - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: false - targets: - - expr: sum (rate (container_network_receive_bytes_total{kubernetes_io_hostname=~"^$Node$"}[5m])) - interval: 10s - intervalFactor: 1 - legendFormat: Received - metric: network - refId: A - step: 10 - - expr: '- sum (rate (container_network_transmit_bytes_total{kubernetes_io_hostname=~"^$Node$"}[5m]))' - interval: 10s - intervalFactor: 1 - legendFormat: Sent - metric: network - refId: B - step: 10 - timeFrom: - timeShift: - title: Network I/O pressure - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - show: true - yaxes: - - format: Bps - label: - logBase: 1 - max: - min: - show: true - - format: Bps - label: - logBase: 1 - max: - min: - show: false - title: Network I/O pressure - - collapse: false - editable: true - height: 250px - panels: - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percent - gauge: - 
maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - height: 180px - id: 4 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (container_memory_working_set_bytes{id="/",kubernetes_io_hostname=~"^$Node$"}) - / sum (machine_memory_bytes{kubernetes_io_hostname=~"^$Node$"}) * 100 - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: 65, 90 - title: Cluster memory usage - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - height: 180px - id: 6 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (rate (container_cpu_usage_seconds_total{id="/",kubernetes_io_hostname=~"^$Node$"}[5m])) - / sum (machine_cpu_cores{kubernetes_io_hostname=~"^$Node$"}) * 100 - 
interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: 65, 90 - title: Cluster CPU usage (5m avg) - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - height: 180px - id: 7 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (container_fs_usage_bytes{device=~"^/dev/[sv]da[0-9]$",id=~"/.+",kubernetes_io_hostname=~"^$Node$"}) - / sum (container_fs_limit_bytes{device=~"^/dev/[sv]da[0-9]$",id=~"/.+",kubernetes_io_hostname=~"^$Node$"}) - * 100 - interval: 10s - intervalFactor: 1 - legendFormat: '' - metric: '' - refId: A - step: 10 - thresholds: 65, 90 - title: Cluster filesystem usage - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: bytes - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: 1px - id: 9 - interval: - isNew: true - links: [] - mappingType: 1 - 
mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 20% - prefix: '' - prefixFontSize: 20% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (container_memory_working_set_bytes{id="/",kubernetes_io_hostname=~"^$Node$"}) - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: '' - title: Used - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: bytes - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: 1px - id: 10 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (machine_memory_bytes{kubernetes_io_hostname=~"^$Node$"}) - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: '' - title: Total - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: 
"${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: 1px - id: 11 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: " cores" - postfixFontSize: 30% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (rate (container_cpu_usage_seconds_total{id="/",kubernetes_io_hostname=~"^$Node$"}[5m])) - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: '' - title: Used - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: 1px - id: 12 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: " cores" - postfixFontSize: 30% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (machine_cpu_cores{kubernetes_io_hostname=~"^$Node$"}) - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: '' - title: Total - type: singlestat - 
valueFontSize: 50% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: bytes - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: 1px - id: 13 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (container_fs_usage_bytes{device=~"^/dev/[sv]da[0-9]$",id=~"/.+",kubernetes_io_hostname=~"^$Node$"}) - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: '' - title: Used - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - format: bytes - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: 1px - id: 14 - interval: - isNew: true - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 
118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: sum (container_fs_limit_bytes{device=~"^/dev/[sv]da[0-9]$",id=~"/.+",kubernetes_io_hostname=~"^$Node$"}) - interval: 10s - intervalFactor: 1 - refId: A - step: 10 - thresholds: '' - title: Total - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - showTitle: false - title: Total usage - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 3 - editable: true - error: false - fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '' - id: 17 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (rate (container_cpu_usage_seconds_total{image!="",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (pod) - interval: 10s - intervalFactor: 1 - legendFormat: "{{ pod }}" - metric: container_cpu - refId: A - step: 10 - timeFrom: - timeShift: - title: Pods CPU usage (5m avg) - tooltip: - msResolution: true - shared: true - sort: 2 - value_type: cumulative - transparent: false - type: graph - xaxis: - show: true - yaxes: - - format: none - label: cores - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - showTitle: false - title: Pods CPU usage - - collapse: true - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 3 - editable: true - error: false - fill: 0 - grid: - 
threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - height: '' - id: 24 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: false - min: false - rightSide: true - show: true - sideWidth: - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (rate (container_cpu_usage_seconds_total{image!="",name=~"^k8s_.*",container!="POD",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (container, pod) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: 'pod: {{ pod }} | {{ container }}' - metric: container_cpu - refId: A - step: 10 - - expr: sum (rate (container_cpu_usage_seconds_total{image!="",name!~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (kubernetes_io_hostname, name, image) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: 'docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})' - metric: container_cpu - refId: B - step: 10 - - expr: sum (rate (container_cpu_usage_seconds_total{rkt_container_name!="",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (kubernetes_io_hostname, rkt_container_name) - interval: 10s - intervalFactor: 1 - legendFormat: 'rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}' - metric: container_cpu - refId: C - step: 10 - timeFrom: - timeShift: - title: Containers CPU usage (5m avg) - tooltip: - msResolution: true - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: none - label: cores - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: Containers CPU usage - - collapse: true - editable: true - height: 500px - 
panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 3 - editable: true - error: false - fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 20 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: false - show: true - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (rate (container_cpu_usage_seconds_total{id!="/",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (id) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "{{ id }}" - metric: container_cpu - refId: A - step: 10 - timeFrom: - timeShift: - title: All processes CPU usage (5m avg) - tooltip: - msResolution: true - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: none - label: cores - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - showTitle: false - title: All processes CPU usage - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 25 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] 
- span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (container_memory_working_set_bytes{image!="",kubernetes_io_hostname=~"^$Node$"}) - by (pod) - interval: 10s - intervalFactor: 1 - legendFormat: "{{ pod }}" - metric: container_memory_usage:sort_desc - refId: A - step: 10 - timeFrom: - timeShift: - title: Pods memory usage - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: Pods memory usage - - collapse: true - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 27 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (container_memory_working_set_bytes{image!="",name=~"^k8s_.*",container!="POD",kubernetes_io_hostname=~"^$Node$"}) - by (container, pod) - interval: 10s - intervalFactor: 1 - legendFormat: 'pod: {{ pod }} | {{ container }}' - metric: container_memory_usage:sort_desc - refId: A - step: 10 - - expr: sum (container_memory_working_set_bytes{image!="",name!~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}) - by (kubernetes_io_hostname, name, image) - interval: 10s - intervalFactor: 1 - legendFormat: 'docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})' - metric: container_memory_usage:sort_desc 
- refId: B - step: 10 - - expr: sum (container_memory_working_set_bytes{rkt_container_name!="",kubernetes_io_hostname=~"^$Node$"}) - by (kubernetes_io_hostname, rkt_container_name) - interval: 10s - intervalFactor: 1 - legendFormat: 'rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}' - metric: container_memory_usage:sort_desc - refId: C - step: 10 - timeFrom: - timeShift: - title: Containers memory usage - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: Containers memory usage - - collapse: true - editable: true - height: 500px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 0 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 28 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: false - show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: true - targets: - - expr: sum (container_memory_working_set_bytes{id!="/",kubernetes_io_hostname=~"^$Node$"}) - by (id) - interval: 10s - intervalFactor: 1 - legendFormat: "{{ id }}" - metric: container_memory_usage:sort_desc - refId: A - step: 10 - timeFrom: - timeShift: - title: All processes memory usage - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - 
min: - show: false - title: All processes memory usage - - collapse: false - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 16 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: true - show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: false - targets: - - expr: sum (rate (container_network_receive_bytes_total{image!="",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (pod) - interval: 10s - intervalFactor: 1 - legendFormat: "-> {{ pod }}" - metric: network - refId: A - step: 10 - - expr: '- sum (rate (container_network_transmit_bytes_total{image!="",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (pod)' - interval: 10s - intervalFactor: 1 - legendFormat: "<- {{ pod }}" - metric: network - refId: B - step: 10 - timeFrom: - timeShift: - title: Pods network I/O (5m avg) - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: Bps - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: Pods network I/O - - collapse: true - editable: true - height: 250px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 30 - isNew: true - legend: - alignAsTable: true - avg: true - current: 
true - max: false - min: false - rightSide: true - show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: false - targets: - - expr: sum (rate (container_network_receive_bytes_total{image!="",name=~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (container, pod) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "-> pod: {{ pod }} | {{ container }}" - metric: network - refId: B - step: 10 - - expr: '- sum (rate (container_network_transmit_bytes_total{image!="",name=~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (container, pod)' - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "<- pod: {{ pod }} | {{ container }}" - metric: network - refId: D - step: 10 - - expr: sum (rate (container_network_receive_bytes_total{image!="",name!~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (kubernetes_io_hostname, name, image) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "-> docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name - }})" - metric: network - refId: A - step: 10 - - expr: '- sum (rate (container_network_transmit_bytes_total{image!="",name!~"^k8s_.*",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (kubernetes_io_hostname, name, image)' - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "<- docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name - }})" - metric: network - refId: C - step: 10 - - expr: sum (rate (container_network_transmit_bytes_total{rkt_container_name!="",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (kubernetes_io_hostname, rkt_container_name) - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "-> rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name - }}" - metric: network - refId: E - step: 10 - - 
expr: '- sum (rate (container_network_transmit_bytes_total{rkt_container_name!="",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (kubernetes_io_hostname, rkt_container_name)' - hide: false - interval: 10s - intervalFactor: 1 - legendFormat: "<- rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name - }}" - metric: network - refId: F - step: 10 - timeFrom: - timeShift: - title: Containers network I/O (5m avg) - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: Bps - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: Containers network I/O - - collapse: true - editable: true - height: 500px - panels: - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - grid: - threshold1: - threshold1Color: rgba(216, 200, 27, 0.27) - threshold2: - threshold2Color: rgba(234, 112, 112, 0.22) - id: 29 - isNew: true - legend: - alignAsTable: true - avg: true - current: true - max: false - min: false - rightSide: false - show: true - sideWidth: 200 - sort: current - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 12 - stack: false - steppedLine: false - targets: - - expr: sum (rate (container_network_receive_bytes_total{id!="/",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (id) - interval: 10s - intervalFactor: 1 - legendFormat: "-> {{ id }}" - metric: network - refId: A - step: 10 - - expr: '- sum (rate (container_network_transmit_bytes_total{id!="/",kubernetes_io_hostname=~"^$Node$"}[5m])) - by (id)' - interval: 10s - intervalFactor: 1 - legendFormat: "<- {{ id }}" - metric: network - refId: B - step: 10 - timeFrom: - timeShift: - title: All processes network I/O (5m avg) - tooltip: - 
msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - show: true - yaxes: - - format: Bps - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - title: All processes network I/O - time: - from: now-5m - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: ".*" - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: true - multi: false - name: Node - options: [] - query: label_values(kubernetes_io_hostname) - refresh: 1 - type: query - annotations: - list: [] - refresh: 5m - schemaVersion: 12 - version: 13 - links: [] - gnetId: 315 - coredns: - __inputs: - - name: prometheus - label: Prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.4.3 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - annotations: - list: [] - editable: true - gnetId: 5926 - graphTooltip: 0 - hideControls: false - id: - links: [] - rows: - - collapse: false - height: 250px - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 1 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: 
total - yaxis: 2 - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m])) - by (proto) - format: time_series - intervalFactor: 2 - legendFormat: "{{proto}}" - refId: A - step: 60 - - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m])) - format: time_series - intervalFactor: 2 - legendFormat: total - refId: B - step: 60 - thresholds: [] - timeFrom: - timeShift: - title: Requests (total) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: pps - logBase: 1 - max: - min: 0 - show: true - - format: pps - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 12 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: total - yaxis: 2 - - alias: other - yaxis: 2 - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(rate(coredns_dns_request_type_count_total{instance=~"$instance"}[5m])) - by (type) - intervalFactor: 2 - legendFormat: "{{type}}" - refId: A - step: 60 - thresholds: [] - timeFrom: - timeShift: - title: Requests (by qtype) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: pps - logBase: 1 - max: - min: 0 - show: true - - format: pps - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - 
id: 2 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: total - yaxis: 2 - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m])) - by (zone) - intervalFactor: 2 - legendFormat: "{{zone}}" - refId: A - step: 60 - - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m])) - intervalFactor: 2 - legendFormat: total - refId: B - step: 60 - thresholds: [] - timeFrom: - timeShift: - title: Requests (by zone) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: pps - logBase: 1 - max: - min: 0 - show: true - - format: pps - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 10 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: total - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(rate(coredns_dns_request_do_count_total{instance=~"$instance"}[5m])) - intervalFactor: 2 - legendFormat: DO - refId: A - step: 40 - - expr: sum(rate(coredns_dns_request_count_total{instance=~"$instance"}[5m])) - intervalFactor: 2 - legendFormat: total - refId: B - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Requests (DO bit) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - 
buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: pps - logBase: 1 - max: - min: 0 - show: true - - format: pps - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 9 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: tcp:90 - yaxis: 2 - - alias: 'tcp:99 ' - yaxis: 2 - - alias: tcp:50 - yaxis: 2 - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: histogram_quantile(0.99, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m])) - by (le,proto)) - intervalFactor: 2 - legendFormat: "{{proto}}:99 " - refId: A - step: 60 - - expr: histogram_quantile(0.90, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m])) - by (le,proto)) - intervalFactor: 2 - legendFormat: "{{proto}}:90" - refId: B - step: 60 - - expr: histogram_quantile(0.50, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m])) - by (le,proto)) - intervalFactor: 2 - legendFormat: "{{proto}}:50" - refId: C - step: 60 - thresholds: [] - timeFrom: - timeShift: - title: Requests (size, udp) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 14 - legend: - avg: false - current: false - max: false - min: false - show: true - 
total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: tcp:90 - yaxis: 1 - - alias: 'tcp:99 ' - yaxis: 1 - - alias: tcp:50 - yaxis: 1 - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: histogram_quantile(0.99, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m])) - by (le,proto)) - intervalFactor: 2 - legendFormat: "{{proto}}:99 " - refId: A - step: 60 - - expr: histogram_quantile(0.90, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m])) - by (le,proto)) - intervalFactor: 2 - legendFormat: "{{proto}}:90" - refId: B - step: 60 - - expr: histogram_quantile(0.50, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m])) - by (le,proto)) - intervalFactor: 2 - legendFormat: "{{proto}}:50" - refId: C - step: 60 - thresholds: [] - timeFrom: - timeShift: - title: Requests (size,tcp) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: 0 - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Row - titleSize: h6 - - collapse: false - height: 250px - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 5 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: 
sum(rate(coredns_dns_response_rcode_count_total{instance=~"$instance"}[5m])) - by (rcode) - intervalFactor: 2 - legendFormat: "{{rcode}}" - refId: A - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Responses (by rcode) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: pps - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 3 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: histogram_quantile(0.99, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~"$instance"}[5m])) - by (le, job)) - intervalFactor: 2 - legendFormat: 99% - refId: A - step: 40 - - expr: histogram_quantile(0.90, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~"$instance"}[5m])) - by (le)) - intervalFactor: 2 - legendFormat: 90% - refId: B - step: 40 - - expr: histogram_quantile(0.50, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~"$instance"}[5m])) - by (le)) - intervalFactor: 2 - legendFormat: 50% - refId: C - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Responses (duration) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: 
"${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 8 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: udp:50% - yaxis: 1 - - alias: tcp:50% - yaxis: 2 - - alias: tcp:90% - yaxis: 2 - - alias: tcp:99% - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: 'histogram_quantile(0.99, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m])) - by (le,proto)) ' - intervalFactor: 2 - legendFormat: "{{proto}}:99%" - refId: A - step: 40 - - expr: 'histogram_quantile(0.90, sum(rate(coredns_dns_response_size_bytes_bucket{instance="$instance",proto="udp"}[5m])) - by (le,proto)) ' - intervalFactor: 2 - legendFormat: "{{proto}}:90%" - refId: B - step: 40 - - expr: 'histogram_quantile(0.50, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="udp"}[5m])) - by (le,proto)) ' - intervalFactor: 2 - legendFormat: "{{proto}}:50%" - metric: '' - refId: C - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Responses (size, udp) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 13 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: udp:50% 
- yaxis: 1 - - alias: tcp:50% - yaxis: 1 - - alias: tcp:90% - yaxis: 1 - - alias: tcp:99% - yaxis: 1 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: 'histogram_quantile(0.99, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m])) - by (le,proto)) ' - intervalFactor: 2 - legendFormat: "{{proto}}:99%" - refId: A - step: 40 - - expr: 'histogram_quantile(0.90, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m])) - by (le,proto)) ' - intervalFactor: 2 - legendFormat: "{{proto}}:90%" - refId: B - step: 40 - - expr: 'histogram_quantile(0.50, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~"$instance",proto="tcp"}[5m])) - by (le, proto)) ' - intervalFactor: 2 - legendFormat: "{{proto}}:50%" - metric: '' - refId: C - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Responses (size, tcp) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: 0 - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 250px - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 15 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(coredns_cache_size{instance=~"$instance"}) by (type) - intervalFactor: 2 - legendFormat: "{{type}}" - refId: A - step: 40 - thresholds: [] - 
timeFrom: - timeShift: - title: Cache (size) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 16 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: misses - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(rate(coredns_cache_hits_total{instance=~"$instance"}[5m])) by (type) - intervalFactor: 2 - legendFormat: hits:{{type}} - refId: A - step: 40 - - expr: sum(rate(coredns_cache_misses_total{instance=~"$instance"}[5m])) by (type) - intervalFactor: 2 - legendFormat: misses - refId: B - step: 40 - thresholds: [] - timeFrom: - timeShift: - title: Cache (hitrate) - tooltip: - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: pps - logBase: 1 - max: - min: 0 - show: true - - format: pps - logBase: 1 - max: - min: 0 - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - schemaVersion: 14 - style: dark - tags: - - dns - - coredns - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: ".*" - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: true - label: Instance - multi: false - name: 
instance - options: [] - query: up{job="coredns"} - refresh: 1 - regex: .*instance="(.*?)".* - sort: 0 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - time: - from: now-3h - to: now - timepicker: - now: true - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: utc - title: CoreDNS - version: 3 - description: A dashboard for the CoreDNS DNS server. - elasticsearch: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.6.3 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - annotations: - list: - - builtIn: 1 - datasource: "-- Grafana --" - enable: true - hide: true - iconColor: rgba(0, 211, 255, 1) - name: Annotations & Alerts - type: dashboard - editable: true - gnetId: 4358 - graphTooltip: 1 - hideControls: false - id: - links: [] - refresh: 5m - rows: - - collapse: false - height: - panels: - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(178, 49, 13, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 8 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 5 - sparkline: - fillColor: 
rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: (sum(elasticsearch_cluster_health_status{cluster=~"$cluster",color="green"})*2)+sum(elasticsearch_cluster_health_status{cluster=~"$cluster",color="yellow"}) - format: time_series - intervalFactor: 3 - legendFormat: '' - metric: '' - refId: A - step: 40 - thresholds: '0,1,2' - title: Cluster health status - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: GREEN - value: '2' - - op: "=" - text: YELLOW - value: '1' - - op: "=" - text: RED - value: '0' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 10 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: sum(elasticsearch_cluster_health_number_of_nodes{cluster=~"$cluster"}) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - metric: '' - refId: A - step: 40 - thresholds: '' - title: Nodes - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: 
"${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 9 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_number_of_data_nodes{cluster="$cluster"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - metric: '' - refId: A - step: 40 - thresholds: '' - title: Data nodes - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - hideTimeOverride: true - id: 16 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_number_of_pending_tasks{cluster="$cluster"} - format: time_series - interval: '' - 
intervalFactor: 2 - legendFormat: '' - metric: '' - refId: A - step: 40 - thresholds: '' - title: Pending tasks - transparent: false - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Cluster - titleSize: h6 - - collapse: false - height: '' - panels: - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 11 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - minSpan: 2 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - repeat: shard_type - span: 2.4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_active_primary_shards{cluster="$cluster"} - intervalFactor: 2 - legendFormat: '' - refId: A - step: 40 - thresholds: '' - title: active primary shards - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 39 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - 
value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - minSpan: 2 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2.4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_active_shards{cluster="$cluster"} - intervalFactor: 2 - legendFormat: '' - refId: A - step: 40 - thresholds: '' - title: active shards - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 40 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - minSpan: 2 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2.4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_initializing_shards{cluster="$cluster"} - intervalFactor: 2 - legendFormat: '' - refId: A - step: 40 - thresholds: '' - title: initializing shards - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: 
"${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 41 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - minSpan: 2 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2.4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_relocating_shards{cluster="$cluster"} - intervalFactor: 2 - legendFormat: '' - refId: A - step: 40 - thresholds: '' - title: relocating shards - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - height: '50' - id: 42 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - minSpan: 2 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2.4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: true - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: elasticsearch_cluster_health_unassigned_shards{cluster="$cluster"} - intervalFactor: 2 - legendFormat: '' - refId: A - step: 40 - thresholds: '' - title: unassigned shards - type: 
singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Shards - titleSize: h6 - - collapse: false - height: - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 30 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: elasticsearch_process_cpu_percent{cluster="$cluster",es_master_node="true",name=~"$node"} - format: time_series - instant: false - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }} - master" - metric: '' - refId: A - step: 10 - - expr: elasticsearch_process_cpu_percent{cluster="$cluster",es_data_node="true",name=~"$node"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }} - data" - metric: '' - refId: B - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: CPU usage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: percent - label: CPU usage - logBase: 1 - max: 100 - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 0 - grid: {} - height: '400' - id: 31 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - 
hideZero: false - max: true - min: true - rightSide: false - show: true - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: elasticsearch_jvm_memory_used_bytes{cluster="$cluster",name=~"$node",name=~"$node"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }} - used: {{area}}" - metric: '' - refId: A - step: 10 - - expr: elasticsearch_jvm_memory_committed_bytes{cluster="$cluster",name=~"$node",name=~"$node"} - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - committed: {{area}}" - refId: B - step: 10 - - expr: elasticsearch_jvm_memory_max_bytes{cluster="$cluster",name=~"$node",name=~"$node"} - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - max: {{area}}" - refId: C - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: JVM memory usage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: Memory - logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 32 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - 
targets: - - expr: 1-(elasticsearch_filesystem_data_available_bytes{cluster="$cluster"}/elasticsearch_filesystem_data_size_bytes{cluster="$cluster",name=~"$node"}) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }} - {{path}}" - metric: '' - refId: A - step: 10 - thresholds: - - colorMode: custom - fill: true - fillColor: rgba(216, 200, 27, 0.27) - op: gt - value: 0.8 - - colorMode: custom - fill: true - fillColor: rgba(234, 112, 112, 0.22) - op: gt - value: 0.9 - timeFrom: - timeShift: - title: Disk usage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: percentunit - label: Disk Usage % - logBase: 1 - max: 1 - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 47 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - sort: max - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: sent - transform: negative-Y - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: irate(elasticsearch_transport_tx_size_bytes_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} -sent" - refId: D - step: 10 - - expr: irate(elasticsearch_transport_rx_size_bytes_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} -received" - refId: C - step: 10 - thresholds: [] - 
timeFrom: - timeShift: - title: Network usage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: Bps - label: Bytes/sec - logBase: 1 - max: - min: - show: true - - format: pps - label: '' - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: System - titleSize: h6 - - collapse: false - height: '' - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 1 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: elasticsearch_indices_docs{cluster="$cluster",name=~"$node"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Documents count - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: Documents - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 24 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - 
min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: irate(elasticsearch_indices_indexing_index_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Documents indexed rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: index calls/s - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 25 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: rate(elasticsearch_indices_docs_deleted{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Documents deleted rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: 
true - values: [] - yaxes: - - format: short - label: Documents/s - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 26 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: rate(elasticsearch_indices_merges_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Documents merged rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: Documents/s - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Documents - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 48 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - sort: avg - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - 
percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: irate(elasticsearch_indices_indexing_index_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }} - indexing" - metric: '' - refId: A - step: 4 - - expr: irate(elasticsearch_indices_search_query_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - query" - refId: B - step: 4 - - expr: irate(elasticsearch_indices_search_fetch_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - fetch" - refId: C - step: 4 - - expr: irate(elasticsearch_indices_merges_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - merges" - refId: D - step: 4 - - expr: irate(elasticsearch_indices_refresh_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - refresh" - refId: E - step: 4 - - expr: irate(elasticsearch_indices_flush_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - flush" - refId: F - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: Total Operations rate - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: Operations/s - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 49 - 
legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - sort: avg - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: irate(elasticsearch_indices_indexing_index_time_seconds_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ name }} - indexing" - metric: '' - refId: A - step: 4 - - expr: irate(elasticsearch_indices_search_query_time_ms_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - query" - refId: B - step: 4 - - expr: irate(elasticsearch_indices_search_fetch_time_ms_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - fetch" - refId: C - step: 4 - - expr: irate(elasticsearch_indices_merges_total_time_ms_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - merges" - refId: D - step: 4 - - expr: irate(elasticsearch_indices_refresh_total_time_ms_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - refresh" - refId: E - step: 4 - - expr: irate(elasticsearch_indices_flush_time_ms_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{ name }} - flush" - refId: F - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: Total Operations time - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: 
[] - yaxes: - - format: ms - label: Time - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Total Operations stats - titleSize: h6 - - collapse: false - height: '' - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 33 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: 'rate(elasticsearch_indices_search_query_time_seconds{cluster="$cluster",name=~"$node"}[$interval]) ' - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: Query time - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: ms - label: Time - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 5 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false 
- renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: rate(elasticsearch_indices_indexing_index_time_seconds_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: Indexing time - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: ms - label: Time - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 3 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: rate(elasticsearch_indices_merges_total_time_seconds_total{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: Merging time - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: Time - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - 
repeatRowId: - showTitle: true - title: Times - titleSize: h6 - - collapse: false - height: - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 4 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: elasticsearch_indices_fielddata_memory_size_bytes{cluster="$cluster",name=~"$node"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Field data memory size - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: Memory - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 34 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: 
rate(elasticsearch_indices_fielddata_evictions{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Field data evictions - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: Evictions/s - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 35 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: elasticsearch_indices_query_cache_memory_size_bytes{cluster="$cluster",name=~"$node"} - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Query cache size - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: Size - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: 
'400' - id: 36 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: true - steppedLine: false - targets: - - expr: rate(elasticsearch_indices_query_cache_evictions{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}}" - metric: '' - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Query cache evictions - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: Evictions/s - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Caches - titleSize: h6 - - collapse: false - height: 728 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 45 - legend: - alignAsTable: true - avg: true - current: false - max: true - min: true - show: true - sort: avg - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: ' irate(elasticsearch_thread_pool_rejected_count{cluster="$cluster",name=~"$node"}[$interval])' - format: time_series - intervalFactor: 2 - legendFormat: "{{name}} - {{ type }}" - refId: A - step: 10 - thresholds: [] - timeFrom: - 
timeShift: - title: Thread Pool operations rejected - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 46 - legend: - alignAsTable: true - avg: true - current: false - max: true - min: true - show: true - sort: avg - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: elasticsearch_thread_pool_active_count{cluster="$cluster",name=~"$node"} - format: time_series - intervalFactor: 2 - legendFormat: "{{name}} - {{ type }}" - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Thread Pool operations queued - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - height: '' - id: 43 - legend: - alignAsTable: true - avg: true - current: false - max: true - min: true - show: true - sort: avg - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false 
- steppedLine: false - targets: - - expr: elasticsearch_thread_pool_active_count{cluster="$cluster",name=~"$node"} - format: time_series - intervalFactor: 2 - legendFormat: "{{name}} - {{ type }}" - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Thread Pool threads active - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 44 - legend: - alignAsTable: true - avg: true - current: false - max: true - min: true - show: true - sort: avg - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: irate(elasticsearch_thread_pool_completed_count{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - intervalFactor: 2 - legendFormat: "{{name}} - {{ type }}" - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Thread Pool operations completed - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Thread Pool - titleSize: h6 - - collapse: false - height: - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: 
true - error: false - fill: 1 - grid: {} - height: '400' - id: 7 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: true - steppedLine: false - targets: - - expr: rate(elasticsearch_jvm_gc_collection_seconds_count{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}} - {{gc}}" - metric: '' - refId: A - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: GC count - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: GCs - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - height: '400' - id: 27 - legend: - alignAsTable: true - avg: true - current: true - hideEmpty: false - hideZero: false - max: true - min: true - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: rate(elasticsearch_jvm_gc_collection_seconds_count{cluster="$cluster",name=~"$node"}[$interval]) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{name}} - {{gc}}" - metric: '' - refId: A - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: GC time - 
tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - transparent: false - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: Time - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: JVM Garbage Collection - titleSize: h6 - schemaVersion: 14 - style: dark - tags: - - elasticsearch - - App - templating: - list: - - auto: true - auto_count: 30 - auto_min: 10s - current: - text: auto - value: "$__auto_interval" - hide: 0 - label: Interval - name: interval - options: - - selected: true - text: auto - value: "$__auto_interval" - - selected: false - text: 1m - value: 1m - - selected: false - text: 10m - value: 10m - - selected: false - text: 30m - value: 30m - - selected: false - text: 1h - value: 1h - - selected: false - text: 6h - value: 6h - - selected: false - text: 12h - value: 12h - - selected: false - text: 1d - value: 1d - - selected: false - text: 7d - value: 7d - - selected: false - text: 14d - value: 14d - - selected: false - text: 30d - value: 30d - query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d - refresh: 2 - type: interval - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: Instance - multi: false - name: cluster - options: [] - query: label_values(elasticsearch_cluster_health_status,cluster) - refresh: 1 - regex: '' - sort: 1 - tagValuesQuery: - tags: [] - tagsQuery: - type: query - useTags: false - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: true - label: node - multi: true - name: node - options: [] - query: label_values(elasticsearch_process_cpu_percent,name) - refresh: 1 
- regex: '' - sort: 1 - tagValuesQuery: - tags: [] - tagsQuery: - type: query - useTags: false - time: - from: now-12h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: browser - title: Elasticsearch - version: 1 - description: Elasticsearch detailed dashboard - kubernetes_capacity_planning: - __inputs: - - name: DS_PROMETHEUS - label: prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.4.1 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - annotations: - list: [] - description: '' - editable: true - gnetId: 22 - graphTooltip: 0 - hideControls: false - id: - links: [] - refresh: false - rows: - - collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 3 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(rate(node_cpu{mode="idle"}[2m])) * 100 - hide: false - intervalFactor: 10 - legendFormat: '' - refId: A - step: 50 - thresholds: [] - timeFrom: - timeShift: - title: Idle cpu - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: percent - label: cpu usage - 
logBase: 1 - max: - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 9 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(node_load1) - intervalFactor: 4 - legendFormat: load 1m - refId: A - step: 20 - target: '' - - expr: sum(node_load5) - intervalFactor: 4 - legendFormat: load 5m - refId: B - step: 20 - target: '' - - expr: sum(node_load15) - intervalFactor: 4 - legendFormat: load 15m - refId: C - step: 20 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: System load - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: percentunit - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 4 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: node_memory_SwapFree{instance="172.17.0.1:9100",job="prometheus"} - yaxis: 2 - 
spaceLength: 10 - span: 9 - stack: true - steppedLine: false - targets: - - expr: sum(node_memory_MemTotal) - sum(node_memory_MemFree) - sum(node_memory_Buffers) - - sum(node_memory_Cached) - intervalFactor: 2 - legendFormat: memory usage - metric: memo - refId: A - step: 10 - target: '' - - expr: sum(node_memory_Buffers) - interval: '' - intervalFactor: 2 - legendFormat: memory buffers - metric: memo - refId: B - step: 10 - target: '' - - expr: sum(node_memory_Cached) - interval: '' - intervalFactor: 2 - legendFormat: memory cached - metric: memo - refId: C - step: 10 - target: '' - - expr: sum(node_memory_MemFree) - interval: '' - intervalFactor: 2 - legendFormat: memory free - metric: memo - refId: D - step: 10 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: Memory usage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 5 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: "((sum(node_memory_MemTotal) - sum(node_memory_MemFree) - 
sum(node_memory_Buffers) - - sum(node_memory_Cached)) / sum(node_memory_MemTotal)) * 100" - intervalFactor: 2 - metric: '' - refId: A - step: 60 - target: '' - thresholds: 80, 90 - title: Memory usage - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 246 - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 6 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: read - yaxis: 1 - - alias: '{instance="172.17.0.1:9100"}' - yaxis: 2 - - alias: io time - yaxis: 2 - spaceLength: 10 - span: 9 - stack: false - steppedLine: false - targets: - - expr: sum(rate(node_disk_bytes_read[5m])) - hide: false - intervalFactor: 4 - legendFormat: read - refId: A - step: 20 - target: '' - - expr: sum(rate(node_disk_bytes_written[5m])) - intervalFactor: 4 - legendFormat: written - refId: B - step: 20 - - expr: sum(rate(node_disk_io_time_ms[5m])) - intervalFactor: 4 - legendFormat: io time - refId: C - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Disk I/O - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: ms - label: - logBase: 1 - max: - min: - show: true - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - 
editable: true - error: false - format: percentunit - gauge: - maxValue: 1 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 12 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: (sum(node_filesystem_size{device!="rootfs"}) - sum(node_filesystem_free{device!="rootfs"})) - / sum(node_filesystem_size{device!="rootfs"}) - intervalFactor: 2 - refId: A - step: 60 - target: '' - thresholds: 0.75, 0.9 - title: Disk space usage - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 8 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: 'transmitted ' - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(rate(node_network_receive_bytes{device!~"lo"}[5m])) - hide: false - intervalFactor: 2 - legendFormat: '' - refId: A - step: 10 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: Network received - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - 
type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 10 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: 'transmitted ' - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(rate(node_network_transmit_bytes{device!~"lo"}[5m])) - hide: false - intervalFactor: 2 - legendFormat: '' - refId: B - step: 10 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: Network transmitted - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: bytes - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 276 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 11 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 9 - stack: false - steppedLine: false - targets: - - expr: sum(kube_pod_info) - format: time_series - intervalFactor: 2 - legendFormat: 
Current number of Pods - refId: A - step: 10 - - expr: sum(kube_node_status_capacity_pods) - format: time_series - intervalFactor: 2 - legendFormat: Maximum capacity of pods - refId: B - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Cluster Pod Utilization - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 7 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: 100 - (sum(kube_node_status_capacity_pods) - sum(kube_pod_info)) / sum(kube_node_status_capacity_pods) - * 100 - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 60 - target: '' - thresholds: '80,90' - title: Pod Utilization - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Dashboard Row - titleSize: h6 - schemaVersion: 14 - style: dark - tags: [] - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus 
datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - time: - from: now-1h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: browser - title: Kubernetes Capacity Planning - version: 4 - inputs: - - name: prometheus - pluginId: prometheus - type: datasource - value: prometheus - overwrite: true - kubernetes_cluster_status: - __inputs: - - name: prometheus - label: prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.4.1 - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - annotations: - list: [] - editable: true - gnetId: - graphTooltip: 0 - hideControls: false - id: - links: [] - rows: - - collapse: false - height: 129 - panels: - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 5 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 6 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: sum(up{job=~"apiserver|kube-scheduler|kube-controller-manager"} == 0) - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - 
step: 600 - thresholds: '1,3' - title: Control Plane UP - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: UP - value: 'null' - valueName: total - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 6 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 6 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: sum(ALERTS{alertstate="firing",alertname!="DeadMansSwitch"}) - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '3,5' - title: Alerts Firing - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: '0' - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Cluster Health - titleSize: h6 - - collapse: false - height: 168 - panels: - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - decimals: - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 1 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - 
rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: (sum(up{job="apiserver"} == 1) / count(up{job="apiserver"})) * 100 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '50,80' - title: API Servers UP - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - decimals: - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 2 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: (sum(up{job="kube-controller-manager-discovery"} == 1) / count(up{job="kube-controller-manager-discovery"})) - * 100 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '50,80' - title: Controller Managers UP - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(245, 54, 54, 0.9) - - rgba(237, 129, 40, 0.89) - - rgba(50, 172, 45, 0.97) - datasource: "${DS_PROMETHEUS}" - decimals: - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - 
thresholdLabels: false - thresholdMarkers: true - id: 3 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: (sum(up{job="kube-scheduler-discovery"} == 1) / count(up{job="kube-scheduler-discovery"})) - * 100 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '50,80' - title: Schedulers UP - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - decimals: - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - hideTimeOverride: false - id: 4 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: count(increase(kube_pod_container_status_restarts{namespace=~"kube-system|tectonic-system"}[1h]) - > 5) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '1,3' - title: Crashlooping Control Plane Pods - type: singlestat - 
valueFontSize: 80% - valueMaps: - - op: "=" - text: '0' - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Control Plane Status - titleSize: h6 - - collapse: false - height: 158 - panels: - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 8 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: sum(100 - (avg by (instance) (rate(node_cpu{job="node-exporter",mode="idle"}[5m])) - * 100)) / count(node_cpu{job="node-exporter",mode="idle"}) - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '80,90' - title: CPU Utilization - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 7 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - 
rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: "((sum(node_memory_MemTotal) - sum(node_memory_MemFree) - sum(node_memory_Buffers) - - sum(node_memory_Cached)) / sum(node_memory_MemTotal)) * 100" - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '80,90' - title: Memory Utilization - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 9 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: (sum(node_filesystem_size{device!="rootfs"}) - sum(node_filesystem_free{device!="rootfs"})) - / sum(node_filesystem_size{device!="rootfs"}) - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '80,90' - title: Filesystem Utilization - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: percent - gauge: 
- maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 10 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: 100 - (sum(kube_node_status_capacity_pods) - sum(kube_pod_info)) / sum(kube_node_status_capacity_pods) - * 100 - format: time_series - intervalFactor: 2 - legendFormat: '' - refId: A - step: 600 - thresholds: '80,90' - title: Pod Utilization - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Capacity Planing - titleSize: h6 - schemaVersion: 14 - style: dark - tags: [] - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - time: - from: now-6h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: '' - title: Kubernetes Cluster Status - version: 3 - inputs: - - name: prometheus - pluginId: prometheus - type: datasource - value: prometheus - overwrite: true - nginx_stats: - __inputs: - - name: prometheus - label: prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.5.2 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource 
- id: prometheus - name: Prometheus - version: 1.0.0 - annotations: - list: [] - description: Show stats from the hnlq715/nginx-vts-exporter. - editable: true - gnetId: 2949 - graphTooltip: 0 - hideControls: false - id: - links: [] - refresh: 5m - rows: - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 7 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 12 - stack: false - steppedLine: false - targets: - - expr: sum(nginx_upstream_responses_total{upstream=~"^$Upstream$"}) by (status_code, - upstream) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ status_code }}.{{ upstream }}" - metric: nginx_upstream_response - refId: A - step: 4 - thresholds: [] - timeFrom: - timeShift: - title: HTTP Response Codes by Upstream - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Dashboard Row - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 6 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - 
steppedLine: false - targets: - - expr: sum(irate(nginx_upstream_requests_total{upstream=~"^$Upstream$"}[5m])) - by (upstream) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ upstream }}" - metric: nginx_upstream_requests - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Upstream Requests rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 5 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(irate(nginx_upstream_bytes_total{upstream=~"^$Upstream$"}[5m])) by - (direction, upstream) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ direction }}.{{ upstream }}" - metric: nginx_upstream_bytes - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Upstream Bytes Transfer rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Dashboard Row - titleSize: h6 - - collapse: false - height: 250px - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: 
"${DS_PROMETHEUS}" - fill: 1 - id: 1 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(irate(nginx_connections_total[5m])) by (type) - format: time_series - intervalFactor: 2 - legendFormat: "{{ type }}" - metric: nginx_server_connections - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Overall Connections rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 4 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(irate(nginx_cache_total{ server_zone=~"$ingress"}[5m])) by (server_zone, - type) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ type }}.{{ server_zone }}" - metric: nginx_server_cache - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Cache Action rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: 
- logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Dashboard Row - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 3 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(irate(nginx_requests_total{ server_zone=~"$ingress" }[5m])) by (server_zone) - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: "{{ server_zone }}" - metric: nginx_server_requests - refId: A - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Overall Requests rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 2 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(irate(nginx_bytes_total{ server_zone=~"$ingress" }[5m])) by (direction, - server_zone) - format: time_series - intervalFactor: 2 - legendFormat: "{{ direction }}.{{ server_zone }}" - metric: nginx_server_bytes - refId: A - step: 10 - thresholds: [] - timeFrom: 
- timeShift: - title: Overall Bytes Transferred rate - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Dashboard Row - titleSize: h6 - schemaVersion: 14 - style: dark - tags: - - prometheus - - nginx - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: ".*" - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: - multi: true - name: Upstream - options: [] - query: label_values(nginx_upstream_bytes_total, upstream) - refresh: 1 - regex: '' - sort: 1 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: - multi: true - name: ingress - options: [] - query: label_values(nginx_bytes_total, server_zone) - refresh: 1 - regex: "/^[^\\*_]+$/" - sort: 1 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - time: - from: now-1h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: browser - title: Nginx Stats - version: 13 - nodes: - __inputs: - - name: prometheus - label: prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.4.1 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - 
name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - annotations: - list: [] - description: Dashboard to get an overview of one server - editable: true - gnetId: 22 - graphTooltip: 0 - hideControls: false - id: - links: [] - refresh: false - rows: - - collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 3 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: 100 - (avg by (cpu) (irate(node_cpu{mode="idle", instance="$server"}[5m])) - * 100) - hide: false - intervalFactor: 10 - legendFormat: "{{cpu}}" - refId: A - step: 50 - thresholds: [] - timeFrom: - timeShift: - title: Idle cpu - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: percent - label: cpu usage - logBase: 1 - max: 100 - min: 0 - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 9 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: node_load1{instance="$server"} - 
intervalFactor: 4 - legendFormat: load 1m - refId: A - step: 20 - target: '' - - expr: node_load5{instance="$server"} - intervalFactor: 4 - legendFormat: load 5m - refId: B - step: 20 - target: '' - - expr: node_load15{instance="$server"} - intervalFactor: 4 - legendFormat: load 15m - refId: C - step: 20 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: System load - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: percentunit - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 4 - legend: - alignAsTable: false - avg: false - current: false - hideEmpty: false - hideZero: false - max: false - min: false - rightSide: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: node_memory_SwapFree{instance="172.17.0.1:9100",job="prometheus"} - yaxis: 2 - spaceLength: 10 - span: 9 - stack: true - steppedLine: false - targets: - - expr: node_memory_MemTotal{instance="$server"} - node_memory_MemFree{instance="$server"} - - node_memory_Buffers{instance="$server"} - node_memory_Cached{instance="$server"} - hide: false - interval: '' - intervalFactor: 2 - legendFormat: memory used - metric: '' - refId: C - step: 10 - - expr: node_memory_Buffers{instance="$server"} - interval: '' - intervalFactor: 2 - legendFormat: memory buffers - metric: '' - refId: E - step: 10 - - expr: 
node_memory_Cached{instance="$server"} - intervalFactor: 2 - legendFormat: memory cached - metric: '' - refId: F - step: 10 - - expr: node_memory_MemFree{instance="$server"} - intervalFactor: 2 - legendFormat: memory free - metric: '' - refId: D - step: 10 - thresholds: [] - timeFrom: - timeShift: - title: Memory usage - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percent - gauge: - maxValue: 100 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 5 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: ((node_memory_MemTotal{instance="$server"} - node_memory_MemFree{instance="$server"} - - node_memory_Buffers{instance="$server"} - node_memory_Cached{instance="$server"}) - / node_memory_MemTotal{instance="$server"}) * 100 - intervalFactor: 2 - refId: A - step: 60 - target: '' - thresholds: 80, 90 - title: Memory usage - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: 
false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 6 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: read - yaxis: 1 - - alias: '{instance="172.17.0.1:9100"}' - yaxis: 2 - - alias: io time - yaxis: 2 - spaceLength: 10 - span: 9 - stack: false - steppedLine: false - targets: - - expr: sum by (instance) (rate(node_disk_bytes_read{instance="$server"}[2m])) - hide: false - intervalFactor: 4 - legendFormat: read - refId: A - step: 20 - target: '' - - expr: sum by (instance) (rate(node_disk_bytes_written{instance="$server"}[2m])) - intervalFactor: 4 - legendFormat: written - refId: B - step: 20 - - expr: sum by (instance) (rate(node_disk_io_time_ms{instance="$server"}[2m])) - intervalFactor: 4 - legendFormat: io time - refId: C - step: 20 - thresholds: [] - timeFrom: - timeShift: - title: Disk I/O - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: ms - label: - logBase: 1 - max: - min: - show: true - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: percentunit - gauge: - maxValue: 1 - minValue: 0 - show: true - thresholdLabels: false - thresholdMarkers: true - id: 7 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - 
nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: (sum(node_filesystem_size{device!="rootfs",instance="$server"}) - sum(node_filesystem_free{device!="rootfs",instance="$server"})) - / sum(node_filesystem_size{device!="rootfs",instance="$server"}) - intervalFactor: 2 - refId: A - step: 60 - target: '' - thresholds: 0.75, 0.9 - title: Disk space usage - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - - collapse: false - height: 250px - panels: - - alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 8 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: 'transmitted ' - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: rate(node_network_receive_bytes{instance="$server",device!~"lo"}[5m]) - hide: false - intervalFactor: 2 - legendFormat: "{{device}}" - refId: A - step: 10 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: Network received - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - 
alerting: {} - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 10 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: 'transmitted ' - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: rate(node_network_transmit_bytes{instance="$server",device!~"lo"}[5m]) - hide: false - intervalFactor: 2 - legendFormat: "{{device}}" - refId: B - step: 10 - target: '' - thresholds: [] - timeFrom: - timeShift: - title: Network transmitted - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: - show: true - - format: bytes - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: New row - titleSize: h6 - schemaVersion: 14 - style: dark - tags: [] - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: Server - multi: false - name: host - options: [] - query: label_values(node_uname_info, nodename) - refresh: 1 - regex: '' - sort: 0 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 2 - includeAll: false - label: Instance - multi: false - name: server - options: [] - query: label_values(node_uname_info{nodename="$host"}, instance) - 
refresh: 1 - regex: '' - sort: 0 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - time: - from: now-1h - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: browser - title: Nodes - version: 2 - inputs: - - name: prometheus - pluginId: prometheus - type: datasource - value: prometheus - overwrite: true - rabbitmq: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.2.0 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - annotations: - list: [] - editable: true - gnetId: 2121 - graphTooltip: 0 - hideControls: false - id: - links: [] - refresh: 5m - rows: - - collapse: false - height: 266 - panels: - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(50, 172, 45, 0.97) - - rgba(237, 129, 40, 0.89) - - rgba(245, 54, 54, 0.9) - datasource: "${DS_PROMETHEUS}" - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 13 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 3 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - targets: - - expr: rabbitmq_up{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - metric: 
rabbitmq_up{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - refId: A - step: 2 - thresholds: Up,Down - timeFrom: 30s - title: RabbitMQ Server - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - - op: "=" - text: Down - value: '0' - - op: "=" - text: Up - value: '1' - valueName: current - - alert: - conditions: - - evaluator: - params: - - 1 - type: lt - operator: - type: and - query: - params: - - A - - 10s - - now - reducer: - params: [] - type: last - type: query - - evaluator: - params: [] - type: no_value - operator: - type: and - query: - params: - - A - - 10s - - now - reducer: - params: [] - type: last - type: query - executionErrorState: alerting - frequency: 60s - handler: 1 - message: Some of the RabbitMQ node is down - name: Node Stats alert - noDataState: no_data - notifications: [] - aliasColors: {} - bars: true - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 12 - legend: - alignAsTable: true - avg: false - current: true - max: false - min: false - show: true - total: false - values: true - lines: false - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 9 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_running{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}" - metric: rabbitmq_running - refId: A - step: 2 - thresholds: - - colorMode: critical - fill: true - line: true - op: lt - value: 1 - timeFrom: 30s - timeShift: - title: Node up Stats - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - 
fill: 1 - id: 6 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_exchangesTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{instance}}:exchanges" - metric: rabbitmq_exchangesTotal - refId: A - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Exchanges - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 4 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_channelsTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{instance}}:channels" - metric: rabbitmq_channelsTotal - refId: A - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Channels - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 3 - 
legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_consumersTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{instance}}:consumers" - metric: rabbitmq_consumersTotal - refId: A - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Consumers - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 5 - legend: - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_connectionsTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{instance}}:connections" - metric: rabbitmq_connectionsTotal - refId: A - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Connections - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 7 - legend: - alignAsTable: true - avg: true - 
current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 4 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_queuesTotal{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{instance}}:queues" - metric: rabbitmq_queuesTotal - refId: A - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Queues - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 8 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum by (vhost)(rabbitmq_queue_messages_ready{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}) - intervalFactor: 2 - legendFormat: "{{vhost}}:ready" - metric: rabbitmq_queue_messages_ready - refId: A - step: 2 - - expr: sum by (vhost)(rabbitmq_queue_messages_published_total{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}) - intervalFactor: 2 - legendFormat: "{{vhost}}:published" - metric: rabbitmq_queue_messages_published_total - refId: B - step: 2 - - expr: sum by (vhost)(rabbitmq_queue_messages_delivered_total{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}) - intervalFactor: 2 - legendFormat: "{{vhost}}:delivered" - metric: 
rabbitmq_queue_messages_delivered_total - refId: C - step: 2 - - expr: sum by (vhost)(rabbitmq_queue_messages_unacknowledged{application="prometheus_rabbitmq_exporter",release_group="$rabbit"}) - intervalFactor: 2 - legendFormat: "{{vhost}}:unack" - metric: ack - refId: D - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Messages/host - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - decimals: 0 - fill: 1 - id: 2 - legend: - alignAsTable: true - avg: false - current: true - max: false - min: false - rightSide: false - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_queue_messages{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{queue}}:{{durable}}" - metric: rabbitmq_queue_messages - refId: A - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Messages / Queue - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 9 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - 
seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_node_mem_used{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}:used" - metric: rabbitmq_node_mem_used - refId: A - step: 2 - - expr: rabbitmq_node_mem_limit{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}:limit" - metric: node_mem - refId: B - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Memory - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: decbytes - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 10 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_fd_used{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}:used" - metric: '' - refId: A - step: 2 - - expr: rabbitmq_fd_total{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}:total" - metric: node_mem - refId: B - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: FIle descriptors - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - datasource: 
"${DS_PROMETHEUS}" - fill: 1 - id: 11 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - span: 6 - stack: false - steppedLine: false - targets: - - expr: rabbitmq_sockets_used{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}:used" - metric: '' - refId: A - step: 2 - - expr: rabbitmq_sockets_total{application="prometheus_rabbitmq_exporter",release_group="$rabbit"} - intervalFactor: 2 - legendFormat: "{{node}}:total" - metric: '' - refId: B - step: 2 - thresholds: [] - timeFrom: - timeShift: - title: Sockets - tooltip: - shared: true - sort: 0 - value_type: individual - transparent: false - type: graph - xaxis: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Dashboard Row - titleSize: h6 - schemaVersion: 14 - style: dark - tags: [] - templating: - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - current: {} - hide: 0 - label: null - name: rabbit - options: [] - type: query - query: label_values(rabbitmq_up, release_group) - refresh: 1 - sort: 1 - datasource: "${DS_PROMETHEUS}" - time: - from: now-5m - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: browser - title: RabbitMQ Metrics - version: 17 - description: 'Basic rabbitmq host stats: Node Stats, 
Exchanges, Channels, Consumers, Connections, - Queues, Messages, Messages per Queue, Memory, File Descriptors, Sockets.' - openstack_control_plane: - __inputs: - - name: prometheus - label: prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.5.2 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - - type: panel - id: text - name: Text - version: '' - annotations: - list: [] - editable: true - gnetId: - graphTooltip: 1 - hideControls: false - id: - links: [] - refresh: 5m - rows: - - collapse: false - height: 250px - panels: - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 24 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=keystone - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_keystone_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: 
fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Keystone - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 23 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=glance - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_glance_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Glance - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: 
'1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(202, 58, 40, 0.86) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 22 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=heat - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_heat_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Heat - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: 
false - thresholdMarkers: true - id: 21 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=neutron - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_neutron_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Neutron - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(208, 53, 34, 0.82) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 20 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=nova - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - 
postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_nova_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Nova - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 19 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=swift - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_swift_api{job="openstack-metrics", 
region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Ceph - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 18 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=cinder - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_cinder_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Cinder - type: singlestat - 
valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 17 - interval: "> 60s" - links: - - dashboard: Openstack Service - name: Drilldown dashboard - params: var-Service=placement - title: Openstack Service - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_placement_api{job="openstack-metrics", region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Placement - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(208, 53, 34, 0.82) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 
0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 16 - interval: "> 60s" - links: - - dashboard: RabbitMQ Metrics - name: Drilldown dashboard - title: RabbitMQ Metrics - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: min(rabbitmq_up) - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: RabbitMQ - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(208, 53, 34, 0.82) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 15 - interval: "> 60s" - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% 
- rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: min(mysql_global_status_wsrep_ready) - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: MariaDB - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(225, 177, 40, 0.59) - - rgba(208, 53, 34, 0.82) - - rgba(118, 245, 40, 0.73) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 14 - interval: "> 60s" - links: - - dashboard: Nginx Stats - name: Drilldown dashboard - title: Nginx Stats - type: dashboard - mappingType: 2 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: '1' - text: OK - to: '99999999999999' - - from: '0' - text: CRIT - to: '0' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: sum_over_time(nginx_connections_total{type="active", namespace="openstack"}[5m]) - fill: '' - format: time_series - function: last - groupBy: - - params: 
- - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '0,1' - title: Nginx - type: singlestat - valueFontSize: 50% - valueName: current - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(208, 53, 34, 0.82) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 13 - interval: "> 60s" - links: - - dashboard: Memcached - name: Drilldown dashboard - title: Memcached - type: dashboard - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: min(memcached_up) - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '1,2' - title: Memcached - type: singlestat - valueFontSize: 50% - valueMaps: - - op: "=" - text: no data - value: 'null' - - op: "=" - text: CRIT - value: '0' - - op: "=" - text: OK - value: '1' - - op: "=" - text: UNKW - value: '2' - valueName: current - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: OpenStack Services - titleSize: h6 - - collapse: false - height: 250px - 
panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 11 - interval: "> 60s" - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 3 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - alias: free - column: value - expr: openstack_total_used_vcpus{job="openstack-metrics", region="$region"} + openstack_total_free_vcpus{job="openstack-metrics", - region="$region"} - format: time_series - function: min - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - - alias: used - column: value - expr: openstack_total_used_vcpus{job="openstack-metrics", region="$region"} - format: time_series - function: max - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - intervalFactor: 2 - policy: default - rawQuery: false - refId: B - resultFormat: time_series - step: 120 - thresholds: [] - timeFrom: - timeShift: - title: VCPUs (total vs used) - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 12 - interval: "> 60s" - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - 
linewidth: 3 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - alias: free - column: value - expr: openstack_total_used_ram_MB{job="openstack-metrics", region="$region"} + openstack_total_free_ram_MB{job="openstack-metrics", - region="$region"} - format: time_series - function: mean - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - - alias: used - column: value - expr: openstack_total_used_ram_MB{job="openstack-metrics", region="$region"} - format: time_series - function: mean - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: B - resultFormat: time_series - step: 120 - thresholds: [] - timeFrom: - timeShift: - title: RAM (total vs used) - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: mbytes - label: '' - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 13 - interval: "> 60s" - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 3 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - alias: free - column: value - expr: 
openstack_total_used_disk_GB{job="openstack-metrics", region="$region"} + openstack_total_free_disk_GB{job="openstack-metrics", - region="$region"} - format: time_series - function: mean - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - - alias: used - column: value - expr: openstack_total_used_disk_GB{job="openstack-metrics", region="$region"} - format: time_series - function: mean - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - intervalFactor: 2 - policy: default - rawQuery: false - refId: B - resultFormat: time_series - step: 120 - thresholds: [] - timeFrom: - timeShift: - title: Disk (used vs total) - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: gbytes - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes": false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 27 - interval: "> 60s" - legend: - alignAsTable: false - avg: true - current: true - hideEmpty: true - hideZero: false - max: true - min: true - show: true - total: false - values: true - lines: true - linewidth: 4 - links: [] - nullPointMode: null - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - stack: false - steppedLine: false - targets: - - alias: free - column: value - expr: sum(openstack_running_instances) - format: time_series - function: mean - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - interval: "15s" - intervalFactor: 1 - legendFormat: "{{ running_vms }}" - policy: default - 
rawQuery: false - refID: A - resultFormat: time_series - - alias: used - column: value - expr: sum(openstack_total_running_instances) - format: time_series - function: mean - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - interval: "15s" - intervalFactor: 1 - legendFormat: "{{ total_vms }}" - policy: default - rawQuery: false - refID: B - resultFormat: time_series - step: 120 - thresholds: [] - timeFrom: - timeShift: - title: OpenStack Instances - tooltip: - msResolution: false - shared: true - sort : 0 - value_type: cumulative - transparent: true - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: none - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: false - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Virtual resources - titleSize: h6 - schemaVersion: 14 - style: dark - tags: [] - templating: - enable: true - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: - multi: false - name: region - options: [] - query: label_values(openstack_exporter_cache_refresh_duration_seconds, region) - refresh: 1 - regex: '' - sort: 0 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - time: - from: now-1h - to: now - timepicker: - collapse: false - enable: true - notice: false - now: true - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - status: Stable - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - type: timepicker - timezone: browser - title: OpenStack Metrics - version: 2 - openstack-service: - __inputs: - - name: prometheus - label: 
prometheus - description: '' - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.5.2 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - annotations: - enable: true - list: [] - editable: true - gnetId: - graphTooltip: 1 - hideControls: false - id: - links: [] - refresh: 5m - rows: - - collapse: false - height: 250px - panels: - - cacheTimeout: - colorBackground: true - colorValue: false - colors: - - rgba(225, 177, 40, 0.59) - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 6 - interval: "> 60s" - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - column: value - condition: '' - expr: openstack_check_[[Service]]_api{job="openstack-metrics",region="$region"} - fill: '' - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - 'null' - type: fill - groupByTags: [] - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - thresholds: '0,1' - title: '' - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: CRITICAL - value: '0' - - op: "=" - text: OK - value: '1' - valueName: current - - 
cacheTimeout: - colorBackground: false - colorValue: false - colors: - - rgba(200, 54, 35, 0.88) - - rgba(118, 245, 40, 0.73) - - rgba(225, 177, 40, 0.59) - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 13 - interval: "> 60s" - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - column: value - condition: '' - expr: sum(nginx_responses_total{server_zone=~"[[Service]].*", status_code="5xx",region="$region"}) - fill: '' - format: time_series - function: count - groupBy: - - interval: auto - params: - - auto - type: time - - params: - - '0' - type: fill - groupby_field: '' - interval: '' - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - step: 120 - tags: [] - thresholds: '' - title: HTTP 5xx errors - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: '0' - value: 'null' - valueName: current - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 0 - grid: {} - id: 7 - interval: ">60s" - legend: - alignAsTable: true - avg: true - current: false - max: true - min: true - show: true - sortDesc: true - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 8 - stack: false - steppedLine: false - targets: - - expr: 
sum(nginx_upstream_response_msecs_avg{upstream=~"openstack-[[Service]].*",region="$region"}) - by (upstream) - format: time_series - intervalFactor: 2 - refId: A - step: 120 - thresholds: [] - timeFrom: - timeShift: - title: HTTP response time - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: 0 - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - grid: {} - id: 9 - interval: "> 60s" - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: true - targets: - - alias: healthy - column: value - expr: openstack_check_[[Service]]_api{region="$region"} - format: time_series - function: last - groupBy: - - params: - - "$interval" - type: time - - params: - - '0' - type: fill - groupByTags: [] - intervalFactor: 2 - policy: default - rawQuery: false - refId: A - resultFormat: time_series - select: [] - step: 120 - tags: [] - thresholds: [] - timeFrom: - timeShift: - title: API Availability - tooltip: - msResolution: false - shared: false - sort: 0 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: none - label: '' - logBase: 1 - max: 1 - min: 0 - show: false - - format: short - logBase: 1 - max: - min: - show: false - - aliasColors: - '{status_code="2xx"}': "#629E51" - '{status_code="5xx"}': "#BF1B00" - bars: true - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - 
fill: 0 - grid: {} - id: 8 - interval: "> 60s" - legend: - alignAsTable: false - avg: false - current: false - hideEmpty: false - max: false - min: false - rightSide: false - show: true - total: false - values: false - lines: false - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 8 - stack: true - steppedLine: false - targets: - - expr: sum(nginx_responses_total{server_zone=~"[[Service]].*",region="$region"}) by (status_code) - format: time_series - intervalFactor: 2 - refId: A - step: 120 - thresholds: [] - timeFrom: - timeShift: - title: Number of HTTP responses - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - logBase: 1 - max: - min: 0 - show: true - - format: short - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Service Status - titleSize: h6 - schemaVersion: 14 - style: dark - tags: [] - templating: - enable: true - list: - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - allValue: - current: {} - datasource: prometheus - hide: 0 - includeAll: false - label: region - multi: false - name: region - options: [] - query: label_values(openstack_exporter_cache_refresh_duration_seconds, region) - refresh: 1 - regex: '' - sort: 0 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - - allValue: - current: - tags: [] - text: cinder - value: cinder - hide: 0 - includeAll: false - label: - multi: false - name: Service - options: - - selected: false - text: nova - value: nova - - selected: false - text: glance - value: glance - - selected: false - text: keystone - value: 
keystone - - selected: true - text: cinder - value: cinder - - selected: false - text: heat - value: heat - - selected: false - text: placement - value: placement - - selected: false - text: neutron - value: neutron - query: nova,glance,keystone,cinder,heat,placement,neutron - type: custom - time: - from: now-1h - to: now - timepicker: - collapse: false - enable: true - notice: false - now: true - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - status: Stable - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - type: timepicker - timezone: browser - title: Openstack Service - version: 4 - prometheus: - __inputs: - - name: DS_PROMETHEUS - label: Prometheus - description: Prometheus which you want to monitor - type: datasource - pluginId: prometheus - pluginName: Prometheus - __requires: - - type: grafana - id: grafana - name: Grafana - version: 4.6.0 - - type: panel - id: graph - name: Graph - version: '' - - type: datasource - id: prometheus - name: Prometheus - version: 1.0.0 - - type: panel - id: singlestat - name: Singlestat - version: '' - - type: panel - id: text - name: Text - version: '' - annotations: - list: - - builtIn: 1 - datasource: "-- Grafana --" - enable: true - hide: true - iconColor: rgba(0, 211, 255, 1) - name: Annotations & Alerts - type: dashboard - - datasource: "${DS_PROMETHEUS}" - enable: true - expr: count(sum(up{instance="$instance"}) by (instance) < 1) - hide: false - iconColor: rgb(250, 44, 18) - limit: 100 - name: downage - showIn: 0 - step: 30s - tagKeys: instance - textFormat: prometheus down - titleFormat: Downage - type: alert - - datasource: "${DS_PROMETHEUS}" - enable: true - expr: sum(changes(prometheus_config_last_reload_success_timestamp_seconds[10m])) - by (instance) - hide: false - iconColor: "#fceaca" - limit: 100 - name: Reload - showIn: 0 - step: 5m - tagKeys: instance - tags: [] - titleFormat: Reload - type: tags - description: Dashboard for 
monitoring of Prometheus v2.x.x - editable: true - gnetId: 3681 - graphTooltip: 1 - hideControls: false - id: - links: - - icon: info - tags: [] - targetBlank: true - title: 'Dashboard''s Github ' - tooltip: Github repo of this dashboard - type: link - url: https://github.com/FUSAKLA/Prometheus2-grafana-dashboard - - icon: doc - tags: [] - targetBlank: true - title: Prometheus Docs - tooltip: '' - type: link - url: http://prometheus.io/docs/introduction/overview/ - refresh: 5m - rows: - - collapse: false - height: 161 - panels: - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - "#299c46" - - rgba(237, 129, 40, 0.89) - - "#bf1b00" - datasource: "${DS_PROMETHEUS}" - decimals: 1 - format: s - gauge: - maxValue: 1000000 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 41 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: time() - process_start_time_seconds{instance="$instance"} - format: time_series - instant: false - intervalFactor: 2 - refId: A - thresholds: '' - title: Uptime - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - "#299c46" - - rgba(237, 129, 40, 0.89) - - "#bf1b00" - datasource: "${DS_PROMETHEUS}" - format: short - gauge: - maxValue: 1000000 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 42 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - 
value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 4 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: true - tableColumn: '' - targets: - - expr: prometheus_tsdb_head_series{instance="$instance"} - format: time_series - instant: false - intervalFactor: 2 - refId: A - thresholds: '500000,800000,1000000' - title: Total count of time series - type: singlestat - valueFontSize: 150% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - "#299c46" - - rgba(237, 129, 40, 0.89) - - "#d44a3a" - datasource: "${DS_PROMETHEUS}" - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 48 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: version - targets: - - expr: prometheus_build_info{instance="$instance"} - format: table - instant: true - intervalFactor: 2 - refId: A - thresholds: '' - title: Version - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - - cacheTimeout: - colorBackground: false - colorValue: false - colors: - - "#299c46" - - rgba(237, 129, 40, 0.89) - - "#d44a3a" - datasource: "${DS_PROMETHEUS}" - decimals: 2 - format: ms - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 49 - interval: - 
links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 2 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: prometheus_tsdb_head_max_time{instance="$instance"} - prometheus_tsdb_head_min_time{instance="$instance"} - format: time_series - instant: true - intervalFactor: 2 - refId: A - thresholds: '' - title: Actual head block length - type: singlestat - valueFontSize: 80% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: current - - content: - height: '' - id: 50 - links: [] - mode: html - span: 1 - title: '' - transparent: true - type: text - - cacheTimeout: - colorBackground: false - colorValue: true - colors: - - "#e6522c" - - rgba(237, 129, 40, 0.89) - - "#299c46" - datasource: "${DS_PROMETHEUS}" - decimals: 1 - format: none - gauge: - maxValue: 100 - minValue: 0 - show: false - thresholdLabels: false - thresholdMarkers: true - id: 52 - interval: - links: [] - mappingType: 1 - mappingTypes: - - name: value to text - value: 1 - - name: range to text - value: 2 - maxDataPoints: 100 - nullPointMode: connected - nullText: - postfix: '' - postfixFontSize: 50% - prefix: '' - prefixFontSize: 50% - rangeMaps: - - from: 'null' - text: N/A - to: 'null' - span: 1 - sparkline: - fillColor: rgba(31, 118, 189, 0.18) - full: false - lineColor: rgb(31, 120, 193) - show: false - tableColumn: '' - targets: - - expr: '2' - format: time_series - intervalFactor: 2 - refId: A - thresholds: '10,20' - title: '' - transparent: true - type: singlestat - valueFontSize: 200% - valueMaps: - - op: "=" - text: N/A - value: 'null' - valueName: avg - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Header instance 
info - titleSize: h6 - - collapse: false - height: '250' - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 15 - legend: - avg: true - current: false - max: false - min: false - show: false - total: false - values: true - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: true - steppedLine: false - targets: - - expr: max(prometheus_engine_query_duration_seconds{instance="$instance"}) by - (instance, slice) - format: time_series - intervalFactor: 1 - legendFormat: max duration for {{slice}} - metric: prometheus_local_storage_rushed_mode - refId: A - step: 900 - thresholds: [] - timeFrom: - timeShift: - title: Query elapsed time - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: '' - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 17 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(increase(prometheus_tsdb_head_series_created_total{instance="$instance"}[$aggregation_interval])) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: created on {{ instance }} 
- metric: prometheus_local_storage_maintain_series_duration_seconds_count - refId: A - step: 1800 - - expr: sum(increase(prometheus_tsdb_head_series_removed_total{instance="$instance"}[$aggregation_interval])) - by (instance) * -1 - format: time_series - intervalFactor: 2 - legendFormat: removed on {{ instance }} - refId: B - thresholds: [] - timeFrom: - timeShift: - title: Head series created/deleted - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 13 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(increase(prometheus_target_scrapes_exceeded_sample_limit_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: exceeded_sample_limit on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: A - step: 1800 - - expr: sum(increase(prometheus_target_scrapes_sample_duplicate_timestamp_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: duplicate_timestamp on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: B - step: 1800 - - expr: 
sum(increase(prometheus_target_scrapes_sample_out_of_bounds_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: out_of_bounds on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: C - step: 1800 - - expr: sum(increase(prometheus_target_scrapes_sample_out_of_order_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: out_of_order on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: D - step: 1800 - - expr: sum(increase(prometheus_rule_evaluation_failures_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: rule_evaluation_failure on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: G - step: 1800 - - expr: sum(increase(prometheus_tsdb_compactions_failed_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: tsdb_compactions_failed on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: K - step: 1800 - - expr: sum(increase(prometheus_tsdb_reloads_failures_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: tsdb_reloads_failures on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: L - step: 1800 - - expr: sum(increase(prometheus_tsdb_head_series_not_found{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: head_series_not_found on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: N - step: 1800 - - expr: 
sum(increase(prometheus_evaluator_iterations_missed_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: evaluator_iterations_missed on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: O - step: 1800 - - expr: sum(increase(prometheus_evaluator_iterations_skipped_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: evaluator_iterations_skipped on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: P - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Prometheus errors - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: false - title: Main info - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - description: '' - editable: true - error: false - fill: 1 - grid: {} - id: 25 - legend: - alignAsTable: true - avg: true - current: true - max: true - min: false - show: false - sort: max - sortDesc: true - total: false - values: true - lines: true - linewidth: 2 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: prometheus_target_interval_length_seconds{instance="$instance",quantile="0.99"} - - 60 - format: time_series - interval: 2m - intervalFactor: 1 - legendFormat: "{{instance}}" - metric: '' - refId: A - step: 300 - thresholds: [] - timeFrom: - 
timeShift: - title: Scrape delay (counts with 1m scrape interval) - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: cumulative - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - logBase: 1 - max: - min: - show: true - - format: short - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 14 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: Queue length - yaxis: 2 - spaceLength: 10 - span: 6 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_evaluator_duration_seconds{instance="$instance"}) by (instance, - quantile) - format: time_series - intervalFactor: 2 - legendFormat: Queue length - metric: prometheus_local_storage_indexing_queue_length - refId: B - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Rule evaulation duration - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Scrape & rule duration - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: 
false - fill: 1 - id: 18 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(increase(http_requests_total{instance="$instance"}[$aggregation_interval])) - by (instance, handler) > 0 - format: time_series - intervalFactor: 2 - legendFormat: "{{ handler }} on {{ instance }}" - metric: '' - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Request count - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: none - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 16 - legend: - avg: false - current: false - hideEmpty: true - hideZero: true - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: max(sum(http_request_duration_microseconds{instance="$instance"}) by (instance, - handler, quantile)) by (instance, handler) > 0 - format: time_series - hide: false - intervalFactor: 2 - legendFormat: "{{ handler }} on {{ instance }}" - refId: B - thresholds: [] - timeFrom: - timeShift: - title: Request duration per handler - tooltip: - msResolution: false - shared: true 
- sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: µs - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 19 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(increase(http_request_size_bytes{instance="$instance", quantile="0.99"}[$aggregation_interval])) - by (instance, handler) > 0 - format: time_series - hide: false - intervalFactor: 2 - legendFormat: "{{ handler }} in {{ instance }}" - refId: B - thresholds: [] - timeFrom: - timeShift: - title: Request size by handler - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Allocated bytes: "#F9BA8F" - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max count collector: "#bf1b00" - Max count harvester: "#bf1b00" - Max to persist: "#3F6833" - RSS: "#890F02" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 8 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 
- links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/Max.*/" - fill: 0 - linewidth: 2 - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_engine_queries{instance="$instance"}) by (instance, handler) - format: time_series - intervalFactor: 2 - legendFormat: 'Current count ' - metric: last - refId: A - step: 1800 - - expr: sum(prometheus_engine_queries_concurrent_max{instance="$instance"}) by - (instance, handler) - format: time_series - intervalFactor: 2 - legendFormat: Max count - metric: last - refId: B - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Cont of concurent queries - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Requests & queries - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: - Alert queue capacity on o collector: "#bf1b00" - Alert queue capacity on o harvester: "#bf1b00" - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 20 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/.*capacity.*/" - fill: 0 - linewidth: 2 - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: 
sum(prometheus_notifications_queue_capacity{instance="$instance"})by (instance) - format: time_series - intervalFactor: 2 - legendFormat: 'Alert queue capacity ' - metric: prometheus_local_storage_checkpoint_last_size_bytes - refId: A - step: 1800 - - expr: sum(prometheus_notifications_queue_length{instance="$instance"})by (instance) - format: time_series - intervalFactor: 2 - legendFormat: 'Alert queue size on ' - metric: prometheus_local_storage_checkpoint_last_size_bytes - refId: B - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Alert queue size - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 21 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_notifications_alertmanagers_discovered{instance="$instance"}) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: Checkpoint chunks written/s - metric: prometheus_local_storage_checkpoint_series_chunks_written_sum - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Count of discovered alertmanagers - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - 
values: [] - yaxes: - - format: none - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 39 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(increase(prometheus_notifications_dropped_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: notifications_dropped on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: F - step: 1800 - - expr: sum(increase(prometheus_rule_evaluation_failures_total{rule_type="alerting",instance="$instance"}[$aggregation_interval])) - by (rule_type,instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: rule_evaluation_failures on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Alerting errors - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Alerting - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - 
dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 45 - legend: - avg: false - current: false - max: false - min: false - show: true - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: increase(prometheus_target_sync_length_seconds_count{scrape_job="kubernetes-service-endpoints"}[$aggregation_interval]) - format: time_series - intervalFactor: 2 - legendFormat: Count of target synces - refId: A - step: 240 - thresholds: [] - timeFrom: - timeShift: - title: Kubernetes SD sync count - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 46 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(increase(prometheus_target_scrapes_exceeded_sample_limit_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: exceeded_sample_limit on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: A - step: 1800 - - expr: 
sum(increase(prometheus_sd_file_read_errors_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - interval: '' - intervalFactor: 2 - legendFormat: sd_file_read_error on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: E - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Service discovery errors - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Service discovery - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 36 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(increase(prometheus_tsdb_reloads_total{instance="$instance"}[30m])) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: "{{ instance }}" - refId: A - thresholds: [] - timeFrom: - timeShift: - title: Reloaded block from disk - tooltip: - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - 
dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 5 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_tsdb_blocks_loaded{instance="$instance"}) by (instance) - format: time_series - intervalFactor: 2 - legendFormat: Loaded data blocks - metric: prometheus_local_storage_memory_chunkdescs - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Loaded data blocks - tooltip: - msResolution: false - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 3 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: prometheus_tsdb_head_series{instance="$instance"} - format: time_series - intervalFactor: 2 - legendFormat: Time series count - metric: prometheus_local_storage_memory_series - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Time series total count - tooltip: - msResolution: false - shared: true - sort: 0 - 
value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 1 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(rate(prometheus_tsdb_head_samples_appended_total{instance="$instance"}[$aggregation_interval])) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: samples/s {{instance}} - metric: prometheus_local_storage_ingested_samples_total - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Samples Appended per second - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: '' - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: TSDB stats - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - To persist: "#9AC48A" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 2 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - 
nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/Max.*/" - fill: 0 - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_tsdb_head_chunks{instance="$instance"}) by (instance) - format: time_series - hide: false - intervalFactor: 2 - legendFormat: Head chunk count - metric: prometheus_local_storage_memory_chunks - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Head chunks count - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 35 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: max(prometheus_tsdb_head_max_time{instance="$instance"}) by (instance) - - min(prometheus_tsdb_head_min_time{instance="$instance"}) by (instance) - format: time_series - intervalFactor: 2 - legendFormat: "{{ instance }}" - refId: A - thresholds: [] - timeFrom: - timeShift: - title: Length of head block - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: ms - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to 
persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 4 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(rate(prometheus_tsdb_head_chunks_created_total{instance="$instance"}[$aggregation_interval])) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: created on {{ instance }} - refId: B - - expr: sum(rate(prometheus_tsdb_head_chunks_removed_total{instance="$instance"}[$aggregation_interval])) - by (instance) * -1 - format: time_series - intervalFactor: 2 - legendFormat: deleted on {{ instance }} - refId: C - thresholds: [] - timeFrom: - timeShift: - title: Head Chunks Created/Deleted per second - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Head block stats - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 33 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: 
sum(increase(prometheus_tsdb_compaction_duration_sum{instance="$instance"}[30m]) - / increase(prometheus_tsdb_compaction_duration_count{instance="$instance"}[30m])) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: "{{ instance }}" - refId: B - thresholds: [] - timeFrom: - timeShift: - title: Compaction duration - tooltip: - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 34 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_tsdb_head_gc_duration_seconds{instance="$instance"}) by - (instance, quantile) - format: time_series - intervalFactor: 2 - legendFormat: "{{ quantile }} on {{ instance }}" - refId: A - thresholds: [] - timeFrom: - timeShift: - title: Go Garbage collection duration - tooltip: - shared: true - sort: 0 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 37 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: 
false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(prometheus_tsdb_wal_truncate_duration_seconds{instance="$instance"}) - by (instance, quantile) - format: time_series - intervalFactor: 2 - legendFormat: "{{ quantile }} on {{ instance }}" - refId: A - thresholds: [] - timeFrom: - timeShift: - title: WAL truncate duration seconds - tooltip: - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - fill: 1 - id: 38 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: connected - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 3 - stack: false - steppedLine: false - targets: - - expr: sum(tsdb_wal_fsync_duration_seconds{instance="$instance"}) by (instance, - quantile) - format: time_series - intervalFactor: 2 - legendFormat: "{{ quantile }} {{ instance }}" - refId: A - thresholds: [] - timeFrom: - timeShift: - title: WAL fsync duration seconds - tooltip: - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: s - label: - logBase: 1 - max: - min: - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Data maintenance - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: - Allocated bytes: "#7EB26D" - Allocated bytes - 1m max: "#BF1B00" - Allocated bytes - 1m min: "#BF1B00" - 
Allocated bytes - 5m max: "#BF1B00" - Allocated bytes - 5m min: "#BF1B00" - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - RSS: "#447EBC" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - decimals: - editable: true - error: false - fill: 1 - id: 6 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: - - alias: "/-/" - fill: 0 - - alias: collector heap size - color: "#E0752D" - fill: 0 - linewidth: 2 - - alias: collector kubernetes memory limit - color: "#BF1B00" - fill: 0 - linewidth: 3 - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(process_resident_memory_bytes{instance="$instance"}) by (instance) - format: time_series - hide: false - intervalFactor: 2 - legendFormat: Total resident memory - {{instance}} - metric: process_resident_memory_bytes - refId: B - step: 1800 - - expr: sum(go_memstats_alloc_bytes{instance="$instance"}) by (instance) - format: time_series - hide: false - intervalFactor: 2 - legendFormat: Total llocated bytes - {{instance}} - metric: go_memstats_alloc_bytes - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Memory - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: - Allocated bytes: "#F9BA8F" - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - RSS: "#890F02" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - 
error: false - fill: 1 - id: 7 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: rate(go_memstats_alloc_bytes_total{instance="$instance"}[$aggregation_interval]) - format: time_series - intervalFactor: 2 - legendFormat: Allocated Bytes/s - metric: go_memstats_alloc_bytes - refId: A - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Allocations per second - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: bytes - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - - aliasColors: {} - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - decimals: 2 - editable: true - error: false - fill: 1 - id: 9 - legend: - alignAsTable: false - avg: false - current: false - hideEmpty: false - max: false - min: false - rightSide: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 4 - stack: false - steppedLine: false - targets: - - expr: sum(rate(process_cpu_seconds_total{instance="$instance"}[$aggregation_interval])) - by (instance) - format: time_series - intervalFactor: 2 - legendFormat: CPU/s - metric: prometheus_local_storage_ingested_samples_total - refId: B - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: CPU per second - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: 
time - name: - show: true - values: - - avg - yaxes: - - format: none - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: RAM&CPU - titleSize: h6 - - collapse: false - height: 250 - panels: - - aliasColors: - Chunks: "#1F78C1" - Chunks to persist: "#508642" - Max chunks: "#052B51" - Max to persist: "#3F6833" - bars: false - dashLength: 10 - dashes: false - datasource: "${DS_PROMETHEUS}" - editable: true - error: false - fill: 1 - id: 47 - legend: - avg: false - current: false - max: false - min: false - show: false - total: false - values: false - lines: true - linewidth: 1 - links: [] - nullPointMode: 'null' - percentage: false - pointradius: 5 - points: false - renderer: flot - seriesOverrides: [] - spaceLength: 10 - span: 12 - stack: false - steppedLine: false - targets: - - expr: sum(increase(net_conntrack_dialer_conn_failed_total{instance="$instance"}[$aggregation_interval])) - by (instance) > 0 - format: time_series - hide: false - interval: '' - intervalFactor: 2 - legendFormat: conntrack_dialer_conn_failed on {{ instance }} - metric: prometheus_local_storage_chunk_ops_total - refId: M - step: 1800 - thresholds: [] - timeFrom: - timeShift: - title: Net errors - tooltip: - msResolution: false - shared: true - sort: 2 - value_type: individual - type: graph - xaxis: - buckets: - mode: time - name: - show: true - values: [] - yaxes: - - format: short - label: - logBase: 1 - max: - min: '0' - show: true - - format: short - label: - logBase: 1 - max: - min: - show: true - repeat: - repeatIteration: - repeatRowId: - showTitle: true - title: Contrac errors - titleSize: h6 - schemaVersion: 14 - style: dark - tags: - - prometheus - templating: - list: - - auto: true - auto_count: 30 - auto_min: 2m - current: - text: auto - value: "$__auto_interval" - hide: 0 - label: aggregation intarval - name: aggregation_interval - options: - - 
selected: true - text: auto - value: "$__auto_interval" - - selected: false - text: 1m - value: 1m - - selected: false - text: 10m - value: 10m - - selected: false - text: 30m - value: 30m - - selected: false - text: 1h - value: 1h - - selected: false - text: 6h - value: 6h - - selected: false - text: 12h - value: 12h - - selected: false - text: 1d - value: 1d - - selected: false - text: 7d - value: 7d - - selected: false - text: 14d - value: 14d - - selected: false - text: 30d - value: 30d - query: 1m,10m,30m,1h,6h,12h,1d,7d,14d,30d - refresh: 2 - type: interval - - allValue: - current: {} - datasource: "${DS_PROMETHEUS}" - hide: 0 - includeAll: false - label: Instance - multi: false - name: instance - options: [] - query: label_values(prometheus_build_info, instance) - refresh: 2 - regex: '' - sort: 2 - tagValuesQuery: '' - tags: [] - tagsQuery: '' - type: query - useTags: false - - current: - text: Prometheus - value: Prometheus - hide: 0 - label: Prometheus datasource - name: DS_PROMETHEUS - options: [] - query: prometheus - refresh: 1 - regex: '' - type: datasource - - current: - text: influxdb(heapster) - kokura - value: influxdb(heapster) - kokura - hide: 0 - label: InfluxDB datasource - name: influx_datasource - options: [] - query: influxdb - refresh: 1 - regex: '' - type: datasource - time: - from: now-7d - to: now - timepicker: - refresh_intervals: - - 5s - - 10s - - 30s - - 1m - - 5m - - 15m - - 30m - - 1h - - 2h - - 1d - time_options: - - 5m - - 15m - - 1h - - 6h - - 12h - - 24h - - 2d - - 7d - - 30d - timezone: browser - title: Prometheus2.0 (v1.0.0 by FUSAKLA) - version: 8 + home_dashboard: |- + { + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": true, + "gnetId": null, + "graphTooltip": 0, + "id": 66, + "links": [], + "panels": [ + { + "content": "
\n ATT Home Dashboard\n
\n
\n AT&T Proprietary (Internal Use Only)\n
", + "editable": true, + "gridPos": { + "h": 3, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 1, + "links": [], + "mode": "html", + "options": {}, + "style": {}, + "title": "", + "transparent": true, + "type": "text" + }, + { + "folderId": 0, + "gridPos": { + "h": 10, + "w": 13, + "x": 6, + "y": 3 + }, + "headings": true, + "id": 3, + "limit": 30, + "links": [], + "options": {}, + "query": "", + "recent": true, + "search": false, + "starred": true, + "tags": [], + "title": "", + "type": "dashlist" + } + ], + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "hidden": true, + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ], + "type": "timepicker" + }, + "timezone": "browser", + "title": "OSH Home", + "version": 1 + } + ceph_cluster: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Ceph Cluster overview.\r\n", + "editable": false, + "overwrite": true, + "gnetId": 917, + "graphTooltip": 0, + "id": 134, + "links": [], + "panels": [ + { + "collapsed": 
false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 35, + "panels": [], + "title": "New row", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 21, + "interval": "1m", + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "avg(ceph_health_status{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=~\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "refId": "A", + "step": 60 + } + ], + "thresholds": "1,1", + "title": "Status", + "type": "singlestat", + "valueFontSize": "100%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + }, + { + "op": "=", + "text": "HEALTHY", + "value": "0" + }, + { + "op": "=", + "text": "WARNING", + "value": "1" + }, + { + "op": "=", + "text": "CRITICAL", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", 
+ "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 4, + "y": 1 + }, + "id": 22, + "interval": "1m", + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "count(ceph_pool_max_avail{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "", + "title": "Pools", + "type": "singlestat", + "valueFontSize": "100%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "bytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 8, + "y": 1 + }, + "id": 33, + "interval": "1m", + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to 
text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "avg(ceph_cluster_total_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "0.025,0.1", + "title": "Cluster Capacity", + "type": "singlestat", + "valueFontSize": "100%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "bytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 12, + "y": 1 + }, + "id": 34, + "interval": "1m", + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + 
"lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "avg(ceph_cluster_total_used_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "0.025,0.1", + "title": "Used Capacity", + "type": "singlestat", + "valueFontSize": "100%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "percentunit", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 16, + "y": 1 + }, + "id": 23, + "interval": "1m", + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "avg(ceph_cluster_total_used_bytes/ceph_cluster_total_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "70,80", + 
"title": "Current Utilization", + "type": "singlestat", + "valueFontSize": "100%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": { + "Available": "#EAB839", + "Total Capacity": "#447EBC", + "Used": "#BF1B00", + "total_avail": "#6ED0E0", + "total_space": "#7EB26D", + "total_used": "#890F02" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 5, + "grid": {}, + "gridPos": { + "h": 8, + "w": 8, + "x": 0, + "y": 5 + }, + "height": "300", + "id": 39, + "interval": "", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 5, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "ceph_health_status{application=\"ceph\",component=\"manager\",instance=\"172.29.0.26:9283\",job=\"ceph-mgr\",namespace=\"ceph\",release_group=\"clcp-ucp-ceph-client\"}", + "fill": 0, + "linewidth": 3, + "stack": false + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "ceph_health_status{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "ceph-health", + "refId": "A", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cluster Status (0-Healthy, 1-Warning, 2-Critical)", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + 
"name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "columns": [ + { + "text": "Current", + "value": "current" + } + ], + "datasource": "${DS_PROMETHEUS}", + "fontSize": "100%", + "gridPos": { + "h": 8, + "w": 8, + "x": 8, + "y": 5 + }, + "id": 40, + "links": [], + "options": {}, + "pageSize": null, + "scroll": true, + "showHeader": true, + "sort": { + "col": 0, + "desc": true + }, + "styles": [ + { + "alias": "Time", + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "pattern": "Time", + "type": "date" + }, + { + "alias": "", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "decimals": 2, + "pattern": "/.*/", + "thresholds": [], + "type": "number", + "unit": "short" + } + ], + "targets": [ + { + "expr": "ceph_mgr_status{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "{{job}} {{ceph_daemon}}", + "refId": "A", + "step": 60 + } + ], + "timeFrom": null, + "timeShift": null, + "title": "Cluster Manager", + "transform": "timeseries_aggregations", + "type": "table" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 13 + }, + "id": 36, + "panels": [], + "title": "New row", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": 
false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 0, + "y": 14 + }, + "id": 26, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(ceph_osd_in{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "", + "title": "OSDs IN", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 40, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 2, + "y": 14 + }, + "id": 27, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + 
"prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(ceph_osd_metadata{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}) - sum(ceph_osd_in{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "1,1", + "title": "OSDs OUT", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 4, + "y": 14 + }, + "id": 28, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": 
"sum(ceph_osd_up{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "", + "title": "OSDs UP", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 40, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 6, + "y": 14 + }, + "id": 29, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(ceph_osd_metadata{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}) - sum(ceph_osd_up{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "1,1", + "title": "OSDs DOWN", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + 
"op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 8, + "y": 14 + }, + "id": 30, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "avg(ceph_osd_numpg{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "250,300", + "title": "Average PGs per OSD", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 17 + }, + "id": 37, + "panels": [], + "repeat": null, + "title": "CLUSTER", + "type": "row" + }, + { + "aliasColors": { + "Available": "#EAB839", + "Total Capacity": "#447EBC", + "Used": "#BF1B00", + "total_avail": "#6ED0E0", + "total_space": "#7EB26D", + 
"total_used": "#890F02" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 4, + "grid": {}, + "gridPos": { + "h": 8, + "w": 8, + "x": 0, + "y": 18 + }, + "height": "300", + "id": 1, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 0, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "Total Capacity", + "fill": 0, + "linewidth": 3, + "stack": false + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "ceph_cluster_total_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"} - ceph_cluster_total_used_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Available", + "refId": "A", + "step": 60 + }, + { + "expr": "ceph_cluster_total_used_bytes{nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Used", + "refId": "B", + "step": 60 + }, + { + "expr": "ceph_cluster_total_bytes{nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Total Capacity", + "refId": "C", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Capacity", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + 
"format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Total Capacity": "#7EB26D", + "Used": "#BF1B00", + "total_avail": "#6ED0E0", + "total_space": "#7EB26D", + "total_used": "#890F02" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 8, + "w": 8, + "x": 8, + "y": 18 + }, + "height": "300", + "id": 3, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum(ceph_osd_op_w{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Write", + "refId": "A", + "step": 60 + }, + { + "expr": "sum(ceph_osd_op_r{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Read", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "IOPS", + "tooltip": { + "msResolution": true, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + 
"values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 8, + "w": 8, + "x": 16, + "y": 18 + }, + "height": "300", + "id": 7, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum(ceph_osd_op_in_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Write", + "refId": "A", + "step": 60 + }, + { + "expr": "sum(ceph_osd_op_out_bytes{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Read", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Throughput", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + 
"min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 26 + }, + "id": 38, + "panels": [], + "title": "New row", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 27 + }, + "id": 18, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/^Total.*$/", + "stack": false + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum(ceph_pool_objects{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Total", + "refId": "A", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Objects in the Cluster", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 1, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { 
+ "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 34 + }, + "id": 19, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/^Total.*$/", + "stack": false + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum(ceph_osd_numpg{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Total", + "refId": "A", + "step": 60 + }, + { + "expr": "sum(ceph_pg_active{application=\"ceph\",release_group=\"$ceph_cluster\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Active", + "refId": "B", + "step": 60 + }, + { + "expr": "sum(ceph_pg_inconsistent{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Inconsistent", + "refId": "C", + "step": 60 + }, + { + "expr": "sum(ceph_pg_creating{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Creating", + "refId": "D", + "step": 60 + }, + { + "expr": "sum(ceph_pg_recovering{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + 
"intervalFactor": 1, + "legendFormat": "Recovering", + "refId": "E", + "step": 60 + }, + { + "expr": "sum(ceph_pg_down{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Down", + "refId": "F", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "PGs", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 1, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 34 + }, + "id": 20, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/^Total.*$/", + "stack": false + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum(ceph_pg_degraded{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Degraded", + "refId": "A", + "step": 60 
+ }, + { + "expr": "sum(ceph_pg_stale{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Stale", + "refId": "B", + "step": 60 + }, + { + "expr": "sum(ceph_pg_undersized{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Undersized", + "refId": "C", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Stuck PGs", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 1, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "ceph", + "cluster" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": 
"query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "label_values(ceph_health_status{nc_region=\"$region\"}, release_group)", + "hide": 0, + "includeAll": false, + "label": "Cluster", + "multi": false, + "name": "ceph_cluster", + "options": [], + "query": "label_values(ceph_health_status{nc_region=\"$region\"}, release_group)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 2, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "auto": true, + "auto_count": 10, + "auto_min": "1m", + "current": { + "text": "1m", + "value": "1m" + }, + "datasource": null, + "hide": 0, + "includeAll": false, + "label": "Interval", + "multi": false, + "name": "interval", + "options": [ + { + "selected": false, + "text": "auto", + "value": "$__auto_interval_interval" + }, + { + "selected": true, + "text": "1m", + "value": "1m" + }, + { + "selected": false, + "text": "10m", + "value": "10m" + }, + { + "selected": false, + "text": "30m", + "value": "30m" + }, + { + "selected": false, + "text": "1h", + "value": "1h" + }, + { + "selected": false, + "text": "6h", + "value": "6h" + }, + { + "selected": false, + "text": "12h", + "value": "12h" + }, + { + "selected": false, + "text": "1d", + "value": "1d" + }, + { + "selected": false, + "text": "7d", + "value": "7d" + }, + { + "selected": false, + "text": "14d", + "value": "14d" + }, + { + "selected": false, + "text": "30d", + "value": "30d" + } + ], + "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d", + "refresh": 2, + "skipUrlSync": false, + "type": "interval" + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Ceph - Cluster", 
+ "uid": "ceph-cluster", + "version": 2 + } + ceph_osd: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "Prometheus.IO", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "CEPH OSD Status.", + "editable": false, + "overwrite": true, + "gnetId": 923, + "graphTooltip": 0, + "id": 140, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 11, + "panels": [], + "title": "New row", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 40, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 0, + "y": 1 + }, + "id": 6, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 2, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": 
"", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + }, + { + "from": "0", + "text": "DOWN", + "to": "0.99" + }, + { + "from": "0.99", + "text": "UP", + "to": "1" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "ceph_osd_up{ceph_daemon=\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "refId": "A", + "step": 60 + } + ], + "thresholds": "0,1", + "timeFrom": null, + "title": "Status", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "DOWN", + "value": "0" + }, + { + "op": "=", + "text": "UP", + "value": "1" + }, + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 40, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 2, + "y": 1 + }, + "id": 8, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 2, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + }, + { + "from": "0", + "text": "OUT", + "to": "0.99" + }, + { + "from": "0.99", + "text": "IN", + "to": "1" + } + 
], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "ceph_osd_in{ceph_daemon=\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "refId": "A", + "step": 60 + } + ], + "thresholds": "0,1", + "timeFrom": null, + "title": "Available", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "DOWN", + "value": "0" + }, + { + "op": "=", + "text": "UP", + "value": "1" + }, + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 2, + "x": 4, + "y": 1 + }, + "id": 10, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 2, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "count(ceph_osd_metadata{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + 
"interval": "$interval", + "intervalFactor": 1, + "refId": "A", + "step": 60 + } + ], + "thresholds": "0,1", + "timeFrom": null, + "title": "Total OSDs", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "DOWN", + "value": "0" + }, + { + "op": "=", + "text": "UP", + "value": "1" + }, + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 4 + }, + "id": 12, + "panels": [], + "title": "OSD: $osd", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 20, + "x": 0, + "y": 5 + }, + "id": 5, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/^Average.*/", + "fill": 0, + "stack": false + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "ceph_osd_numpg{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Number of PGs - {{ $osd }}", + "refId": "A", + "step": 60 + }, + { + "expr": "avg(ceph_osd_numpg{application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Average Number of PGs in the Cluster", + "refId": "B", + "step": 60 + } + ], + "thresholds": [ + 
{ + "colorMode": "custom", + "line": true, + "lineColor": "rgba(216, 200, 27, 0.27)", + "op": "gt", + "value": 250 + }, + { + "colorMode": "custom", + "line": true, + "lineColor": "rgba(234, 112, 112, 0.22)", + "op": "gt", + "value": 300 + } + ], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "PGs", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 20, + "y": 5 + }, + "id": 7, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": 
"(ceph_osd_stat_bytes_used{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}/ceph_osd_stat_bytes{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})*100", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 60 + } + ], + "thresholds": "60,80", + "timeFrom": null, + "title": "Utilization", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 12 + }, + "id": 13, + "panels": [], + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 13 + }, + "id": 2, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "ceph_osd_stat_bytes_used{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Used - {{ osd.$osd }}", + "metric": "ceph_osd_used_bytes", + "refId": "A", + "step": 60 + }, + { + "expr": "ceph_osd_stat_bytes{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"} - 
ceph_osd_stat_bytes_used{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "hide": false, + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Available - {{ $osd }}", + "metric": "ceph_osd_avail_bytes", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "OSD Storage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 5, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 13 + }, + "id": 9, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": false, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": true, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "(ceph_osd_stat_bytes_used{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}/ceph_osd_stat_bytes{ceph_daemon=~\"$osd\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": 
"time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "Available - {{ $osd }}", + "metric": "ceph_osd_avail_bytes", + "refId": "A", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Utilization Variance", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": false, + "schemaVersion": 18, + "style": "dark", + "tags": [ + "ceph", + "osd" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "label_values(ceph_health_status{nc_region=\"$region\"}, release_group)", + "hide": 0, + "includeAll": false, + "label": "Cluster", + "multi": false, + "name": "ceph_cluster", + "options": [], + "query": 
"label_values(ceph_health_status{nc_region=\"$region\"}, release_group)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 2, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "auto": true, + "auto_count": 10, + "auto_min": "1m", + "current": { + "text": "1m", + "value": "1m" + }, + "datasource": null, + "hide": 0, + "includeAll": false, + "label": "Interval", + "multi": false, + "name": "interval", + "options": [ + { + "selected": false, + "text": "auto", + "value": "$__auto_interval_interval" + }, + { + "selected": true, + "text": "1m", + "value": "1m" + }, + { + "selected": false, + "text": "10m", + "value": "10m" + }, + { + "selected": false, + "text": "30m", + "value": "30m" + }, + { + "selected": false, + "text": "1h", + "value": "1h" + }, + { + "selected": false, + "text": "6h", + "value": "6h" + }, + { + "selected": false, + "text": "12h", + "value": "12h" + }, + { + "selected": false, + "text": "1d", + "value": "1d" + }, + { + "selected": false, + "text": "7d", + "value": "7d" + }, + { + "selected": false, + "text": "14d", + "value": "14d" + }, + { + "selected": false, + "text": "30d", + "value": "30d" + } + ], + "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d", + "refresh": 2, + "skipUrlSync": false, + "type": "interval" + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "OSD", + "multi": false, + "name": "osd", + "options": [], + "query": "label_values(ceph_osd_metadata{release_group=\"$ceph_cluster\"}, ceph_daemon)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-30m", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ 
+ "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Ceph - OSD", + "uid": "ceph-osd", + "version": 2 + } + ceph_pool: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "Prometheus.IO", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Ceph Pools dashboard.", + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 143, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 11, + "panels": [], + "title": "Pool: $pool", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 4, + "grid": {}, + "gridPos": { + "h": 7, + "w": 20, + "x": 0, + "y": 1 + }, + "height": "", + "id": 2, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 0, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + 
"renderer": "flot", + "seriesOverrides": [ + { + "alias": "/^Total.*$/", + "fill": 0, + "linewidth": 4, + "stack": false + }, + { + "alias": "/^Raw.*$/", + "color": "#BF1B00", + "fill": 0, + "linewidth": 4 + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "ceph_pool_max_avail{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Total - {{ $pool }}", + "refId": "A", + "step": 60 + }, + { + "expr": "ceph_pool_stored{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Used - {{ $pool }}", + "refId": "B", + "step": 60 + }, + { + "expr": "ceph_pool_max_avail{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"} - ceph_pool_stored{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Available - {{ $pool }}", + "refId": "C", + "step": 60 + }, + { + "expr": "ceph_pool_raw_bytes_used{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Raw - {{ $pool }}", + "refId": "D", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "[[pool_name]] Pool Storage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + 
"label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "percentunit", + "gauge": { + "maxValue": 1, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 20, + "y": 1 + }, + "id": 10, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "(ceph_pool_stored{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"} / ceph_pool_max_avail{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"})", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "refId": "A", + "step": 60 + } + ], + "thresholds": "", + "title": "[[pool_name]] Pool Usage", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, 
+ "w": 24, + "x": 0, + "y": 8 + }, + "id": 12, + "panels": [], + "title": "New row", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 9 + }, + "height": "", + "id": 7, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "ceph_pool_objects{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Objects - {{ $pool_name }}", + "refId": "A", + "step": 60 + }, + { + "expr": "ceph_pool_dirty{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Dirty Objects - {{ $pool_name }}", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Objects in Pool [[pool_name]]", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": 
true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 9 + }, + "id": 4, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "irate(ceph_pool_rd{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}[3m])", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Read - {{ $pool_name }}", + "refId": "B", + "step": 60 + }, + { + "expr": "irate(ceph_pool_wr{pool_id=~\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}[3m])", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Write - {{ $pool_name }}", + "refId": "A", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "[[pool_name]] Pool IOPS", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "IOPS", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": "IOPS", + "logBase": 1, + "max": null, + "min": 
0, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 16 + }, + "id": 5, + "interval": "$interval", + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "irate(ceph_pool_rd_bytes{pool_id=\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}[3m])", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Read Bytes - {{ $pool_name }}", + "refId": "A", + "step": 60 + }, + { + "expr": "irate(ceph_pool_wr_bytes{pool_id=\"$pool\",application=\"ceph\",release_group=\"$ceph_cluster\",nc_region=\"$region\"}[3m])", + "format": "time_series", + "interval": "$interval", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Written Bytes - {{ $pool_name }}", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "[[pool_name]] Pool Throughput", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "Bps", + "label": null, + 
"logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "ceph", + "pools" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "label_values(ceph_health_status{nc_region=\"$region\"}, release_group)", + "hide": 0, + "includeAll": false, + "label": "Cluster", + "multi": false, + "name": "ceph_cluster", + "options": [], + "query": "label_values(ceph_health_status{nc_region=\"$region\"}, release_group)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 2, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "auto": true, + "auto_count": 10, + "auto_min": "1m", + "current": { + "text": "1m", + "value": "1m" + }, + "datasource": null, + "hide": 0, + "includeAll": false, + "label": "Interval", + "multi": false, + "name": "interval", + "options": [ + { + "selected": false, + "text": "auto", + "value": "$__auto_interval_interval" + }, + { + "selected": true, + "text": "1m", + "value": "1m" + }, + { + "selected": false, + "text": "10m", + "value": 
"10m" + }, + { + "selected": false, + "text": "30m", + "value": "30m" + }, + { + "selected": false, + "text": "1h", + "value": "1h" + }, + { + "selected": false, + "text": "6h", + "value": "6h" + }, + { + "selected": false, + "text": "12h", + "value": "12h" + }, + { + "selected": false, + "text": "1d", + "value": "1d" + }, + { + "selected": false, + "text": "7d", + "value": "7d" + }, + { + "selected": false, + "text": "14d", + "value": "14d" + }, + { + "selected": false, + "text": "30d", + "value": "30d" + } + ], + "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d", + "refresh": 2, + "skipUrlSync": false, + "type": "interval" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(ceph_pool_objects{release_group=\"$ceph_cluster\", nc_region=\"$region\"}, pool_id)", + "hide": 0, + "includeAll": false, + "label": "Pool", + "multi": false, + "name": "pool", + "options": [], + "query": "label_values(ceph_pool_objects{release_group=\"$ceph_cluster\", nc_region=\"$region\"}, pool_id)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "Pool", + "multi": false, + "name": "pool_name", + "options": [], + "query": "label_values(ceph_pool_metadata{release_group=\"$ceph_cluster\",pool_id=\"[[pool]]\" }, name)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + 
"timezone": "UTC", + "title": "Ceph - Pools", + "uid": "ceph-pools", + "version": 5 + } + armada_dashboard: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 104, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 9, + "panels": [], + "title": "Deployment Health", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 1 + }, + "id": 23, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "armada_apply_failure_total{manifest=~\"$manifest\",nc_region=~\"$region\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "Armada Apply", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + 
"timeShift": null, + "title": "Armada Apply Failures", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 1 + }, + "id": 28, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "armada_chart_deploy_attempt_total{manifest=~\"$manifest\",nc_region=~\"$region\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{chart}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Helm Chart Attempts", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, 
+ "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 10 + }, + "id": 7, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(armada_chart_handle_failure_total{manifest=~\"$manifest\"})", + "format": "time_series", + "hide": false, + "instant": false, + "intervalFactor": 1, + "legendFormat": "Chart Failures", + "refId": "A" + }, + { + "expr": "sum(armada_chart_test_failure_total{manifest=~\"$manifest\"}) ", + "format": "time_series", + "hide": false, + "intervalFactor": 1, + "legendFormat": "Chart Test Failures", + "refId": "C" + }, + { + "expr": "sum(armada_chart_deploy_failure_total{manifest=~\"$manifest\",nc_region=~\"$region\"}) ", + "format": "time_series", + "hide": false, + "intervalFactor": 1, + "legendFormat": "Chart Deploy Failures", + "refId": "D" + }, + { + "expr": "sum(armada_chart_deploy_failure_total{manifest=~\"$manifest\",action=\"install\",nc_region=~\"$region\"}) ", + "format": "time_series", + "hide": false, + "intervalFactor": 1, + "legendFormat": "Chart Deploy Install Failures", + "refId": "B" + }, + { + "expr": "sum(armada_chart_deploy_failure_total{manifest=~\"$manifest\",action=\"upgrade\",nc_region=~\"$region\"}) ", + "format": "time_series", + "hide": false, + "intervalFactor": 1, + "legendFormat": "Chart Deploy Upgrade Failures", + "refId": "E" + }, + { + "expr": 
"sum(armada_chart_deploy_failure_total{manifest=~\"$manifest\",action=\"noop\",nc_region=~\"$region\"})", + "format": "time_series", + "hide": false, + "intervalFactor": 1, + "legendFormat": "Chart Deploy noop Failures", + "refId": "F" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Site Failures", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": "4", + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "columns": [], + "datasource": "${DS_PROMETHEUS}", + "fontSize": "100%", + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 10 + }, + "id": 27, + "links": [], + "options": {}, + "pageSize": null, + "scroll": true, + "showHeader": true, + "sort": { + "col": 0, + "desc": true + }, + "styles": [ + { + "alias": "Time", + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "pattern": "Time", + "type": "date" + }, + { + "alias": "", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "decimals": 2, + "pattern": "chart", + "thresholds": [], + "type": "string", + "unit": "short" + }, + { + "alias": "", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "manifest", + "thresholds": [], + "type": "string", + "unit": "short" + }, + { + "alias": "", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + 
"pattern": "Value", + "thresholds": [], + "type": "number", + "unit": "short" + }, + { + "alias": "", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "/.*/", + "thresholds": [], + "type": "hidden", + "unit": "short" + } + ], + "targets": [ + { + "expr": "armada_chart_handle_failure_total{nc_region=~\"$region\"}>0", + "format": "table", + "instant": true, + "intervalFactor": 1, + "legendFormat": "", + "refId": "A" + } + ], + "title": "Failed Charts", + "transform": "table", + "type": "table" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 19 + }, + "id": 19, + "panels": [], + "title": "Deployment Progress", + "type": "row" + }, + { + "aliasColors": {}, + "bars": true, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 20 + }, + "id": 15, + "legend": { + "alignAsTable": false, + "avg": false, + "current": false, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "sideWidth": null, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "armada_chart_handle_attempt_inprogress{manifest=~\"$manifest\",nc_region=~\"$region\"}>0", + "format": "time_series", + "instant": false, + "intervalFactor": 1, + "legendFormat": "{{chart}}", + "refId": "A" + }, + { + "expr": "count(armada_chart_handle_attempt_inprogress{manifest=~\"$manifest\",nc_region=~\"$region\"})", + "format": "time_series", + "hide": true, + "intervalFactor": 1, + "legendFormat": "Total chart attempts", + "refId": "B" + } + ], + "thresholds": [], + 
"timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Deployment Progress", + "tooltip": { + "shared": false, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": "1", + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "columns": [], + "datasource": "${DS_PROMETHEUS}", + "fontSize": "100%", + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 20 + }, + "id": 21, + "links": [], + "options": {}, + "pageSize": null, + "scroll": true, + "showHeader": true, + "sort": { + "col": 0, + "desc": true + }, + "styles": [ + { + "alias": "Time", + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "pattern": "Time", + "type": "hidden" + }, + { + "alias": "Chart", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "link": false, + "pattern": "Metric", + "thresholds": [], + "type": "string", + "unit": "short" + }, + { + "alias": "", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "Value", + "thresholds": [], + "type": "hidden", + "unit": "short" + }, + { + "alias": "", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "decimals": 2, + "pattern": "/.*/", + "thresholds": [], + "type": "number", + "unit": "short" + } + ], + "targets": [ + { + "expr": "armada_chart_deploy_attempt_inprogress{manifest=~\"$manifest\",nc_region=~\"$region\"}>0", + "format": "time_series", + 
"instant": true, + "intervalFactor": 1, + "legendFormat": "{{chart}}", + "refId": "A" + } + ], + "title": "Current Running Charts", + "transform": "timeseries_to_rows", + "type": "table" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 29 + }, + "id": 11, + "panels": [], + "title": "Timeout usage", + "type": "row" + }, + { + "aliasColors": {}, + "bars": true, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 30 + }, + "id": 2, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 300, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": false, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "(armada_chart_deploy_timeout_usage_ratio_sum{manifest=~\"$manifest\",action=~\"$action\",nc_region=~\"$region\"})*100>10", + "format": "time_series", + "instant": true, + "intervalFactor": 1, + "legendFormat": "{{chart}}", + "refId": "A" + } + ], + "thresholds": [ + { + "colorMode": "ok", + "fill": true, + "line": true, + "op": "gt", + "value": 0 + }, + { + "colorMode": "warning", + "fill": true, + "line": true, + "op": "gt", + "value": 50 + }, + { + "colorMode": "critical", + "fill": true, + "line": true, + "op": "gt", + "value": 80 + } + ], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Percentage Chart Timeout Usage > 10%", + "tooltip": { + "shared": false, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "series", + "name": null, + "show": false, + "values": [ + "avg" + ] + }, + "yaxes": [ + { + "format": 
"short", + "label": "Percentage of timeout used", + "logBase": 1, + "max": "100", + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": true, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 30 + }, + "id": 5, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 300, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": false, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "(armada_chart_deploy_timeout_usage_ratio_sum{manifest=~\"$manifest\",action=~\"$action\",nc_region=~\"$region\"})*100<10", + "format": "time_series", + "instant": true, + "intervalFactor": 1, + "legendFormat": "{{chart}}", + "refId": "A" + } + ], + "thresholds": [ + { + "colorMode": "ok", + "fill": true, + "line": true, + "op": "lt", + "value": 10 + }, + { + "colorMode": "warning", + "fill": true, + "line": true, + "op": "lt", + "value": 5 + }, + { + "colorMode": "critical", + "fill": true, + "line": true, + "op": "lt", + "value": 1 + } + ], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Percentage Chart Timeout Usage < 10%", + "tooltip": { + "shared": false, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "series", + "name": null, + "show": false, + "values": [ + "avg" + ] + }, + "yaxes": [ + { + "decimals": null, + "format": "short", + "label": "Percentage of timeout 
used", + "logBase": 1, + "max": "10", + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": true, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 39 + }, + "id": 25, + "legend": { + "alignAsTable": true, + "avg": false, + "current": false, + "max": true, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 300, + "sortDesc": false, + "total": false, + "values": true + }, + "lines": false, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "armada_chart_handle_concurrency_count_sum{manifest=~\"$manifest\",nc_region=~\"$region\"}/armada_chart_handle_concurrency_count_count{manifest=~\"$manifest\",nc_region=~\"$region\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{chart}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Max Concurrency by Chart", + "tooltip": { + "shared": false, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "series", + "name": null, + "show": false, + "values": [ + "max" + ] + }, + "yaxes": [ + { + "format": "short", + "label": "Concurrency", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": false, + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + 
"list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": { + "selected": false, + "tags": [], + "text": "full-site", + "value": [ + "full-site" + ] + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "Manifest", + "multi": true, + "name": "manifest", + "options": [ + { + "selected": true, + "text": "full-site", + "value": "full-site" + } + ], + "query": "armada_apply_attempt_total", + "refresh": 0, + "regex": "/.*manifest=\"(.*?)\".*/", + "skipUrlSync": false, + "sort": 1, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": { + "tags": [], + "text": "install + upgrade", + "value": [ + "install", + "upgrade" + ] + }, + "hide": 0, + "includeAll": false, + "label": "Armada Action", + "multi": true, + "name": "action", + "options": [ + { + "selected": true, + "text": "install", + "value": "install" + }, + { + "selected": false, + "text": "upgrade", + "value": "upgrade" + }, + { + "selected": false, + "text": "noop", + "value": "noop" + } + ], + "query": "install,upgrade,noop", + "skipUrlSync": false, + "type": "custom" + } + ] + }, + "time": { + "from": "now-6h", + "to": "now" + }, + "timepicker": { 
+ "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "browser", + "title": "Armada Dashboard", + "uid": "armada-dashboard", + "version": 1 + } + containers: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.3.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Monitors Kubernetes cluster using Prometheus. Shows overall cluster CPU / Memory / Filesystem usage as well as individual pod, containers, systemd services statistics. 
Uses cAdvisor metrics only.", + "editable": false, + "overwrite": true, + "gnetId": 315, + "graphTooltip": 0, + "id": 209, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 33, + "panels": [], + "title": "Network I/O pressure", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 5, + "w": 24, + "x": 0, + "y": 1 + }, + "height": "200px", + "id": 32, + "isNew": true, + "legend": { + "alignAsTable": false, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": false, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum (rate (container_network_receive_bytes_total{kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[10m]))", + "format": "time_series", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "Received", + "metric": "network", + "refId": "A", + "step": 10 + }, + { + "expr": "- sum (rate (container_network_transmit_bytes_total{kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[10m]))", + "format": "time_series", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "Sent", + "metric": "network", + "refId": "B", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Network I/O pressure", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": 
{ + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 6 + }, + "id": 34, + "panels": [], + "title": "Total usage", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 8, + "x": 0, + "y": 7 + }, + "height": "180px", + "id": 4, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (container_memory_working_set_bytes{id=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) / sum (machine_memory_bytes{kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) * 100", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "65, 90", + 
"title": "Cluster memory usage", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 8, + "x": 8, + "y": 7 + }, + "height": "180px", + "id": 6, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (rate (container_cpu_usage_seconds_total{id=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) / sum (machine_cpu_cores{kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) * 100", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "65, 90", + "title": "Cluster CPU usage (5m avg)", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 
129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 8, + "x": 16, + "y": 7 + }, + "height": "180px", + "id": 7, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "max(sum (container_fs_usage_bytes{device=~\"^/dev/[sv]da[0-9]$\",nc_region=~\"$region\"}) by (kubernetes_io_hostname) / sum (container_fs_limit_bytes{device=~\"^/dev/[sv]da[0-9]$\",nc_region=~\"$region\"}) by (kubernetes_io_hostname) * 100)", + "format": "time_series", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": "65, 90", + "title": "Cluster filesystem usage", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "bytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + 
"thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 0, + "y": 12 + }, + "height": "1px", + "id": 9, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "20%", + "prefix": "", + "prefixFontSize": "20%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (container_memory_working_set_bytes{id=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"})", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "", + "title": "Used", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "bytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 4, + "y": 12 + }, + "height": "1px", + "id": 10, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + 
"postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (machine_memory_bytes{kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"})", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "", + "title": "Total", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 8, + "y": 12 + }, + "height": "1px", + "id": 11, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": " cores", + "postfixFontSize": "30%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (rate (container_cpu_usage_seconds_total{id=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m]))", + "interval": 
"10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "", + "title": "Used", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 12, + "y": 12 + }, + "height": "1px", + "id": 12, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": " cores", + "postfixFontSize": "30%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (machine_cpu_cores{kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"})", + "interval": "10s", + "intervalFactor": 1, + "refId": "A", + "step": 10 + } + ], + "thresholds": "", + "title": "Total", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": 
"${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "format": "bytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 16, + "y": 12 + }, + "height": "1px", + "id": 13, + "interval": "", + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum (container_fs_usage_bytes{device=~\"^/dev/[sv]da[0-9]$\",nc_region=~\"$region\"})", + "format": "time_series", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": "", + "title": "Used", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "$DS_PROMETHEUS", + "decimals": 2, + "editable": true, + "error": false, + "format": "bytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 20, + "y": 12 + }, + "height": "1px", + "id": 14, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to 
text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(container_fs_limit_bytes{device=~\"^/dev/[sv]da[0-9]$\",nc_region=~\"$region\"})", + "format": "time_series", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": "", + "title": "Total", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 15 + }, + "id": 35, + "panels": [], + "title": "Pods CPU usage", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 3, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 16 + }, + "height": "", + "id": 17, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "sum (rate 
(container_cpu_usage_seconds_total{image!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (pod)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "{{ pod }}", + "metric": "container_cpu", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Pods CPU usage (5m avg)", + "tooltip": { + "msResolution": true, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "cores", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 23 + }, + "id": 36, + "panels": [], + "title": "Containers CPU usage", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 3, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 24 + }, + "height": "", + "id": 24, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": null, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "sum (rate 
(container_cpu_usage_seconds_total{image!=\"\",name=~\"^k8s_.*\",container!=\"POD\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (container, pod)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "pod: {{ pod }} | {{ container }}", + "metric": "container_cpu", + "refId": "A", + "step": 10 + }, + { + "expr": "sum (rate (container_cpu_usage_seconds_total{image!=\"\",name!~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (kubernetes_io_hostname, name, image)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})", + "metric": "container_cpu", + "refId": "B", + "step": 10 + }, + { + "expr": "sum (rate (container_cpu_usage_seconds_total{rkt_container_name!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (kubernetes_io_hostname, rkt_container_name)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}", + "metric": "container_cpu", + "refId": "C", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Containers CPU usage (5m avg)", + "tooltip": { + "msResolution": true, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "cores", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 31 + }, + "id": 37, + "panels": [], + "repeat": null, + "title": "All processes CPU usage", + "type": "row" + }, + { + 
"aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 3, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 13, + "w": 24, + "x": 0, + "y": 32 + }, + "id": 20, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "sum (rate (container_cpu_usage_seconds_total{id!=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (id)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "{{ id }}", + "metric": "container_cpu", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "All processes CPU usage (5m avg)", + "tooltip": { + "msResolution": true, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "cores", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 45 + }, + "id": 38, + "panels": [], + "title": "Pods memory usage", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + 
"datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 46 + }, + "id": 25, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "sum (container_memory_working_set_bytes{image!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) by (pod)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "{{ pod }}", + "metric": "container_memory_usage:sort_desc", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Pods memory usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 53 + }, + "id": 39, + "panels": [], + "title": "Containers memory usage", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + 
"error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 54 + }, + "id": 27, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "sum (container_memory_working_set_bytes{image!=\"\",name=~\"^k8s_.*\",container!=\"POD\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) by (container, pod)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "pod: {{ pod }} | {{ container }}", + "metric": "container_memory_usage:sort_desc", + "refId": "A", + "step": 10 + }, + { + "expr": "sum (container_memory_working_set_bytes{image!=\"\",name!~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) by (kubernetes_io_hostname, name, image)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})", + "metric": "container_memory_usage:sort_desc", + "refId": "B", + "step": 10 + }, + { + "expr": "sum (container_memory_working_set_bytes{rkt_container_name!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) by (kubernetes_io_hostname, rkt_container_name)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}", + "metric": "container_memory_usage:sort_desc", + "refId": "C", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Containers memory usage", + "tooltip": { + "msResolution": false, + 
"shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 61 + }, + "id": 40, + "panels": [], + "title": "All processes memory usage", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 13, + "w": 24, + "x": 0, + "y": 62 + }, + "id": 28, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "sum (container_memory_working_set_bytes{id!=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}) by (id)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "{{ id }}", + "metric": "container_memory_usage:sort_desc", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "All processes memory usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + 
"type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 75 + }, + "id": 41, + "panels": [], + "title": "Pods network I/O", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 76 + }, + "id": 16, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum (rate (container_network_receive_bytes_total{image!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (pod)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "-> {{ pod }}", + "metric": "network", + "refId": "A", + "step": 10 + }, + { + "expr": "- sum (rate (container_network_transmit_bytes_total{image!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (pod)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "<- {{ pod }}", + "metric": "network", + "refId": "B", + "step": 10 + } + ], + "thresholds": 
[], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Pods network I/O (5m avg)", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 83 + }, + "id": 42, + "panels": [], + "title": "Containers network I/O", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 84 + }, + "id": 30, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum (rate (container_network_receive_bytes_total{image!=\"\",name=~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (container, pod)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "-> pod: {{ pod }} | {{ container }}", + "metric": "network", + "refId": "B", + "step": 10 + }, + { + "expr": "- sum (rate 
(container_network_transmit_bytes_total{image!=\"\",name=~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (container, pod)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "<- pod: {{ pod }} | {{ container }}", + "metric": "network", + "refId": "D", + "step": 10 + }, + { + "expr": "sum (rate (container_network_receive_bytes_total{image!=\"\",name!~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (kubernetes_io_hostname, name, image)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "-> docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})", + "metric": "network", + "refId": "A", + "step": 10 + }, + { + "expr": "- sum (rate (container_network_transmit_bytes_total{image!=\"\",name!~\"^k8s_.*\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (kubernetes_io_hostname, name, image)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "<- docker: {{ kubernetes_io_hostname }} | {{ image }} ({{ name }})", + "metric": "network", + "refId": "C", + "step": 10 + }, + { + "expr": "sum (rate (container_network_receive_bytes_total{rkt_container_name!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (kubernetes_io_hostname, rkt_container_name)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "-> rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}", + "metric": "network", + "refId": "E", + "step": 10 + }, + { + "expr": "- sum (rate (container_network_transmit_bytes_total{rkt_container_name!=\"\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (kubernetes_io_hostname, rkt_container_name)", + "hide": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "<- rkt: {{ kubernetes_io_hostname }} | {{ rkt_container_name }}", + "metric": "network", + "refId": "F", + "step": 10 + } + ], + "thresholds": [], + 
"timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Containers network I/O (5m avg)", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 91 + }, + "id": 43, + "panels": [], + "title": "All processes network I/O", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 13, + "w": 24, + "x": 0, + "y": 92 + }, + "id": 29, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum (rate (container_network_receive_bytes_total{id!=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (id)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "-> {{ id }}", + "metric": "network", + "refId": "A", + "step": 10 + }, + { + "expr": "- sum (rate 
(container_network_transmit_bytes_total{id!=\"/\",kubernetes_io_hostname=~\"^$Node$\",nc_region=~\"$region\"}[5m])) by (id)", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "<- {{ id }}", + "metric": "network", + "refId": "B", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "All processes network I/O (5m avg)", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "kubernetes" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": ".+", + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": ".+", + "current": { + "text": "All", + "value": "$__all" + }, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(node_uname_info{nc_region=~\"$region\"}, hostname)", + 
"hide": 0, + "includeAll": true, + "label": "Node", + "multi": false, + "name": "Node", + "options": [], + "query": "label_values(node_uname_info{nc_region=~\"$region\"}, hostname)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-5m", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Container Metrics (cAdvisor)", + "uid": "container-metrics", + "version": 1 + } + coredns: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.3.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "A dashboard for the CoreDNS DNS server.", + "editable": false, + "overwrite": true, + "gnetId": 5926, + "graphTooltip": 0, + "id": 85, + "links": [], + "panels": [ + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + 
"minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 4, + "x": 0, + "y": 0 + }, + "id": 22, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "$$hashKey": "object:956", + "name": "value to text", + "value": 1 + }, + { + "$$hashKey": "object:957", + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "version", + "targets": [ + { + "expr": "coredns_build_info", + "format": "table", + "instant": true, + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A" + } + ], + "thresholds": "", + "title": "Version", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [], + "valueName": "first" + }, + { + "datasource": null, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 5 + }, + "id": 24, + "title": "Row title", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 6 + }, + "hiddenSeries": false, + "id": 1, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pluginVersion": "7.4.5", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "total", + "yaxis": 2 + } + ], + "spaceLength": 
10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(coredns_dns_requests_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (proto)", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{proto}}", + "refId": "A", + "step": 60 + }, + { + "expr": "sum(rate(coredns_dns_requests_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m]))", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "total", + "refId": "B", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Requests (total)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 6 + }, + "hiddenSeries": false, + "id": 12, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pluginVersion": "7.4.5", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "total", + "yaxis": 2 + }, + { + "alias": "other", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": 
"sum(rate(coredns_dns_requests_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (type)", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{type}}", + "refId": "A", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Requests (by qtype)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 6 + }, + "hiddenSeries": false, + "id": 2, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pluginVersion": "7.4.5", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "total", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(coredns_dns_requests_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (zone)", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{zone}}", + "refId": "A", + "step": 60 + }, + { + "expr": "sum(rate(coredns_dns_requests_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m]))", + "interval": "", + "intervalFactor": 2, + "legendFormat": "total", + "refId": "B", + "step": 
60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Requests (by zone)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 13 + }, + "hiddenSeries": false, + "id": 10, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pluginVersion": "7.4.5", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "total", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(coredns_dns_requests_do_count_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m]))", + "interval": "", + "intervalFactor": 2, + "legendFormat": "DO", + "refId": "A", + "step": 40 + }, + { + "expr": "sum(rate(coredns_dns_requests_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m]))", + "interval": "", + "intervalFactor": 2, + "legendFormat": "total", + "refId": "B", + "step": 40 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Requests (DO bit)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + 
"type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "pps", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 6, + "x": 12, + "y": 13 + }, + "hiddenSeries": false, + "id": 9, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pluginVersion": "7.4.5", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "tcp:90", + "yaxis": 2 + }, + { + "alias": "tcp:99 ", + "yaxis": 2 + }, + { + "alias": "tcp:50", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\",nc_region=~\"$region\"}[5m])) by (le,proto))", + "intervalFactor": 2, + "legendFormat": "{{proto}}:99 ", + "refId": "A", + "step": 60 + }, + { + "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\",nc_region=~\"$region\"}[5m])) by (le,proto))", + "intervalFactor": 2, + "legendFormat": "{{proto}}:90", + "refId": "B", + "step": 60 + }, + { + "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\",nc_region=~\"$region\"}[5m])) by (le,proto))", + "intervalFactor": 2, + "legendFormat": 
"{{proto}}:50", + "refId": "C", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Requests (size, udp)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 13 + }, + "hiddenSeries": false, + "id": 14, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pluginVersion": "7.4.5", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "tcp:90", + "yaxis": 1 + }, + { + "alias": "tcp:99 ", + "yaxis": 1 + }, + { + "alias": "tcp:50", + "yaxis": 1 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\",nc_region=~\"$region\"}[5m])) by (le,proto))", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{proto}}:99 ", + "refId": "A", + "step": 60 + }, + { + "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\",nc_region=~\"$region\"}[5m])) by (le,proto))", + "intervalFactor": 2, + 
"legendFormat": "{{proto}}:90", + "refId": "B", + "step": 60 + }, + { + "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_request_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\",nc_region=~\"$region\"}[5m])) by (le,proto))", + "intervalFactor": 2, + "legendFormat": "{{proto}}:50", + "refId": "C", + "step": 60 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Requests (size,tcp)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 20 + }, + "hiddenSeries": false, + "id": 5, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pluginVersion": "7.4.5", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(coredns_dns_responses_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (rcode)", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{rcode}}", + "refId": "A", + "step": 40 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Responses (by 
rcode)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 20 + }, + "hiddenSeries": false, + "id": 3, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pluginVersion": "7.4.5", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (le, job))", + "intervalFactor": 2, + "legendFormat": "99%", + "refId": "A", + "step": 40 + }, + { + "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (le))", + "intervalFactor": 2, + "legendFormat": "90%", + "refId": "B", + "step": 40 + }, + { + "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_request_duration_seconds_bucket{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (le))", + "intervalFactor": 2, + "legendFormat": "50%", + "refId": "C", + "step": 40 + } + ], + "thresholds": [], + "timeFrom": null, + 
"timeRegions": [], + "timeShift": null, + "title": "Responses (duration)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 27 + }, + "hiddenSeries": false, + "id": 8, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pluginVersion": "7.4.5", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "udp:50%", + "yaxis": 1 + }, + { + "alias": "tcp:50%", + "yaxis": 2 + }, + { + "alias": "tcp:90%", + "yaxis": 2 + }, + { + "alias": "tcp:99%", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\",nc_region=~\"$region\"}[5m])) by (le,proto)) ", + "intervalFactor": 2, + "legendFormat": "{{proto}}:99%", + "refId": "A", + "step": 40 + }, + { + "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_response_size_bytes_bucket{instance=\"$instance\",proto=\"udp\",nc_region=~\"$region\"}[5m])) by (le,proto)) ", + "intervalFactor": 2, + "legendFormat": "{{proto}}:90%", + "refId": "B", + "step": 40 + }, + { + 
"expr": "histogram_quantile(0.50, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"udp\",nc_region=~\"$region\"}[5m])) by (le,proto)) ", + "intervalFactor": 2, + "legendFormat": "{{proto}}:50%", + "metric": "", + "refId": "C", + "step": 40 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Responses (size, udp)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 27 + }, + "hiddenSeries": false, + "id": 13, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pluginVersion": "7.4.5", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "udp:50%", + "yaxis": 1 + }, + { + "alias": "tcp:50%", + "yaxis": 1 + }, + { + "alias": "tcp:90%", + "yaxis": 1 + }, + { + "alias": "tcp:99%", + "yaxis": 1 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "histogram_quantile(0.99, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\",nc_region=~\"$region\"}[5m])) by (le,proto)) ", + "intervalFactor": 2, + 
"legendFormat": "{{proto}}:99%", + "refId": "A", + "step": 40 + }, + { + "expr": "histogram_quantile(0.90, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\",nc_region=~\"$region\"}[5m])) by (le,proto)) ", + "intervalFactor": 2, + "legendFormat": "{{proto}}:90%", + "refId": "B", + "step": 40 + }, + { + "expr": "histogram_quantile(0.50, sum(rate(coredns_dns_response_size_bytes_bucket{instance=~\"$instance\",proto=\"tcp\",nc_region=~\"$region\"}[5m])) by (le, proto)) ", + "intervalFactor": 2, + "legendFormat": "{{proto}}:50%", + "metric": "", + "refId": "C", + "step": 40 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Responses (size, tcp)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 34 + }, + "hiddenSeries": false, + "id": 15, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pluginVersion": "7.4.5", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": 
"sum(coredns_cache_entries{instance=~\"$instance\",nc_region=~\"$region\"}) by (type)", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{type}}", + "refId": "A", + "step": 40 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cache (size)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 34 + }, + "hiddenSeries": false, + "id": 16, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pluginVersion": "7.4.5", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "misses", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(coredns_cache_hits_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (type)", + "intervalFactor": 2, + "legendFormat": "hits:{{type}}", + "refId": "A", + "step": 40 + }, + { + "expr": "sum(rate(coredns_cache_misses_total{instance=~\"$instance\",nc_region=~\"$region\"}[5m])) by (type)", + "intervalFactor": 2, + "legendFormat": "misses", + "refId": "B", + "step": 40 + } + ], + "thresholds": [], + 
"timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cache (hitrate)", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "pps", + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "schemaVersion": 27, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "selected": false, + "text": "prometheus", + "value": "prometheus" + }, + "description": null, + "error": null, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": ".+", + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "description": null, + "error": null, + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": { + "query": "label_values(nc_region)", + "refId": "prometheus-region-Variable-Query" + }, + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": ".*", + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "description": null, + "error": null, + "hide": 0, + "includeAll": true, + "label": "Instance", + "multi": false, + "name": "instance", + "options": [], + "query": { + "query": "up{job=\"coredns\",nc_region=~\"$region\"}", + "refId": "prometheus-instance-Variable-Query" + }, + "refresh": 1, + "regex": ".*instance=\"(.*?)\".*", + "skipUrlSync": 
false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "now": true, + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "CoreDNS", + "uid": "coredns", + "version": 4 + } + kubernetes_etcd: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "etcd Grafana dashboard with Prometheus", + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 290, + "links": [], + "panels": [ + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 6, + "x": 0, + "y": 0 + }, + "id": 28, + "interval": null, + "isNew": true, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { 
+ "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(etcd_server_has_leader{job=\"$cluster\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "metric": "etcd_server_has_leader", + "refId": "A", + "step": 20 + } + ], + "thresholds": "", + "title": "Up", + "type": "singlestat", + "valueFontSize": "200%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "gridPos": { + "h": 7, + "w": 10, + "x": 6, + "y": 0 + }, + "id": 23, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(grpc_server_started_total{job=\"$cluster\",grpc_type=\"unary\",nc_region=~\"$region\"}[5m]))", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "RPC Rate", + "metric": "grpc_server_started_total", + "refId": "A", + "step": 2 + }, + { + "expr": "sum(rate(grpc_server_handled_total{job=\"$cluster\",grpc_type=\"unary\",grpc_code!=\"OK\",nc_region=~\"$region\"}[5m]))", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "RPC Failed Rate", + "metric": "grpc_server_handled_total", + "refId": "B", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + 
"title": "RPC Rate", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "ops", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 0 + }, + "id": 41, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum(grpc_server_started_total{job=\"$cluster\",grpc_service=\"etcdserverpb.Watch\",grpc_type=\"bidi_stream\",nc_region=~\"$region\"}) - sum(grpc_server_handled_total{job=\"$cluster\",grpc_service=\"etcdserverpb.Watch\",grpc_type=\"bidi_stream\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Watch Streams", + "metric": "grpc_server_handled_total", + "refId": "A", + "step": 4 + }, + { + "expr": "sum(grpc_server_started_total{job=\"$cluster\",grpc_service=\"etcdserverpb.Lease\",grpc_type=\"bidi_stream\",nc_region=~\"$region\"}) - sum(grpc_server_handled_total{job=\"$cluster\",grpc_service=\"etcdserverpb.Lease\",grpc_type=\"bidi_stream\",nc_region=~\"$region\"})", + "format": "time_series", + 
"intervalFactor": 2, + "legendFormat": "Lease Streams", + "metric": "grpc_server_handled_total", + "refId": "B", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active Streams", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": null, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 7 + }, + "id": 1, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "etcd_mvcc_db_total_size_in_bytes{job=\"$cluster\",nc_region=~\"$region\"}", + "format": "time_series", + "hide": false, + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{instance}} DB Size", + "metric": "", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "DB Size", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + 
"mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 7 + }, + "id": 3, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 1, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "histogram_quantile(0.99, sum(rate(etcd_disk_wal_fsync_duration_seconds_bucket{job=\"$cluster\",nc_region=~\"$region\"}[5m])) by (instance, le))", + "format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "{{instance}} WAL fsync", + "metric": "etcd_disk_wal_fsync_duration_seconds_bucket", + "refId": "A", + "step": 4 + }, + { + "expr": "histogram_quantile(0.99, sum(rate(etcd_disk_backend_commit_duration_seconds_bucket{job=\"$cluster\",nc_region=~\"$region\"}[5m])) by (instance, le))", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}} DB fsync", + "metric": "etcd_disk_backend_commit_duration_seconds_bucket", + "refId": "B", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Disk Sync Duration", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": 
null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 7 + }, + "id": 29, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "process_resident_memory_bytes{job=\"$cluster\",nc_region=~\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}} Resident Memory", + "metric": "process_resident_memory_bytes", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Memory", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + 
"datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 5, + "gridPos": { + "h": 7, + "w": 6, + "x": 0, + "y": 14 + }, + "id": 22, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "rate(etcd_network_client_grpc_received_bytes_total{job=\"$cluster\",nc_region=~\"$region\"}[5m])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}} Client Traffic In", + "metric": "etcd_network_client_grpc_received_bytes_total", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Client Traffic In", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 5, + "gridPos": { + "h": 7, + "w": 6, + "x": 6, + "y": 14 + }, + "id": 21, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + 
"nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "rate(etcd_network_client_grpc_sent_bytes_total{job=\"$cluster\",nc_region=~\"$region\"}[5m])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}} Client Traffic Out", + "metric": "etcd_network_client_grpc_sent_bytes_total", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Client Traffic Out", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "gridPos": { + "h": 7, + "w": 6, + "x": 12, + "y": 14 + }, + "id": 20, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(etcd_network_peer_received_bytes_total{job=\"$cluster\",nc_region=~\"$region\"}[5m])) by (instance)", + "format": 
"time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}} Peer Traffic In", + "metric": "etcd_network_peer_received_bytes_total", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Peer Traffic In", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": null, + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 14 + }, + "id": 16, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(etcd_network_peer_sent_bytes_total{job=\"$cluster\",nc_region=~\"$region\"}[5m])) by (instance)", + "format": "time_series", + "hide": false, + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{instance}} Peer Traffic Out", + "metric": "etcd_network_peer_sent_bytes_total", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Peer Traffic Out", + "tooltip": { + 
"msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 21 + }, + "id": 40, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(etcd_server_proposals_failed_total{job=\"$cluster\",nc_region=~\"$region\"}[5m]))", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Proposal Failure Rate", + "metric": "etcd_server_proposals_failed_total", + "refId": "A", + "step": 2 + }, + { + "expr": "sum(etcd_server_proposals_pending{job=\"$cluster\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Proposal Pending Total", + "metric": "etcd_server_proposals_pending", + "refId": "B", + "step": 2 + }, + { + "expr": "sum(rate(etcd_server_proposals_committed_total{job=\"$cluster\",nc_region=~\"$region\"}[5m]))", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Proposal Commit Rate", + "metric": "etcd_server_proposals_committed_total", + "refId": "C", + "step": 2 + }, + { + 
"expr": "sum(rate(etcd_server_proposals_applied_total{job=\"$cluster\",nc_region=~\"$region\"}[5m]))", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Proposal Apply Rate", + "refId": "D", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Raft Proposals", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "editable": true, + "error": false, + "fill": 0, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 21 + }, + "id": 19, + "isNew": true, + "legend": { + "alignAsTable": false, + "avg": false, + "current": false, + "max": false, + "min": false, + "rightSide": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "changes(etcd_server_leader_changes_seen_total{job=\"$cluster\",nc_region=~\"$region\"}[1d])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{instance}} Total Leader Elections Per Day", + "metric": "etcd_server_leader_changes_seen_total", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": 
null, + "title": "Total Leader Elections Per Day", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "1m", + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 1, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(etcd_server_has_leader{nc_region=~\"$region\"}, job)", + "hide": 0, + "includeAll": false, + "label": "cluster", + "multi": false, + "name": "cluster", + "options": [], + "query": "label_values(etcd_server_has_leader{nc_region=~\"$region\"}, job)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 2, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + 
"to": "now" + }, + "timepicker": { + "now": true, + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Kubernetes etcd", + "uid": "kubernetes-etcd", + "version": 5 + } + kubernetes_cluster_status: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 218, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 11, + "panels": [], + "repeat": null, + "title": "Cluster Health", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 0, + "y": 1 + }, + "id": 5, + "interval": null, + "links": [], + "mappingType": 1, + 
"mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(up{job=~\"apiserver|kube-scheduler|kube-controller-manager\",nc_region=~\"$region\"} == 0)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "1,3", + "title": "Control Plane UP", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "UP", + "value": "null" + } + ], + "valueName": "total" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 6, + "y": 1 + }, + "id": 6, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + 
"tableColumn": "", + "targets": [ + { + "expr": "sum(ALERTS{alertstate=\"firing\",alertname!=\"DeadMansSwitch\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "3,5", + "title": "Alerts Firing", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": null, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 12, + "y": 1 + }, + "hideTimeOverride": false, + "id": 4, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "count(increase(kube_pod_container_status_restarts_total{nc_region=~\"$region\"}[1h]) > 5)", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "1,3", + "title": "Crashlooping Control Plane Pods", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": 
"current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": null, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 18, + "y": 1 + }, + "id": 1, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "(sum(up{job=\"apiserver\",nc_region=~\"$region\"} == 1) / count(up{job=\"apiserver\",nc_region=~\"$region\"})) * 100", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "50,80", + "title": "API Servers UP", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 5 + }, + "id": 13, + "panels": [], + "repeat": null, + "title": "Capacity Planning", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "percent", + "gauge": { +
"maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 6, + "x": 0, + "y": 6 + }, + "id": 8, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(100 - (avg by (instance) (rate(node_cpu_seconds_total{job=\"node-exporter\",mode=\"idle\"}[5m])) * 100)) / count(node_cpu_seconds_total{job=\"node-exporter\",mode=\"idle\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "80,90", + "title": "CPU Utilization", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 6, + "x": 6, + "y": 6 + }, + "id": 7, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + 
"options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "((sum(node_memory_MemTotal_bytes) - sum(node_memory_MemFree_bytes) - sum(node_memory_Buffers_bytes) - sum(node_memory_Cached_bytes)) / sum(node_memory_MemTotal_bytes)) * 100", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "80,90", + "title": "Memory Utilization", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 6, + "x": 12, + "y": 6 + }, + "id": 9, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": 
"(sum(node_filesystem_size_bytes{device!=\"rootfs\",nc_region=~\"$region\"}) - sum(node_filesystem_free_bytes{device!=\"rootfs\",nc_region=~\"$region\"})) / sum(node_filesystem_size_bytes{device!=\"rootfs\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "80,90", + "title": "Filesystem Utilization", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 6, + "x": 18, + "y": 6 + }, + "id": 10, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "100 - (sum(kube_node_status_capacity{resource=\"pods\"}) by (nc_region) - sum(kube_pod_info) by (nc_region))/ sum(kube_node_status_capacity{resource=\"pods\"}) by (nc_region)* 100", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 600 + } + ], + "thresholds": "80,90", + "title": "Pod Utilization", + "type": "singlestat", + 
"valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "fill": 1, + "gridPos": { + "h": 6, + "w": 6, + "x": 0, + "y": 11 + }, + "id": 17, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(kube_node_status_capacity{resource=\"cpu\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "allocatable", + "refId": "A" + }, + { + "expr": "sum(kube_node_status_allocatable{resource=\"cpu\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "capacity", + "refId": "B" + }, + { + "expr": "sum(kube_pod_container_resource_requests{resource=\"cpu\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "requested", + "refId": "C" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cluster CPU Capacity", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": null, + "format": "none", + "label": "cores", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + 
"bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "fill": 1, + "gridPos": { + "h": 6, + "w": 6, + "x": 6, + "y": 11 + }, + "id": 19, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(kube_node_status_allocatable{resource=\"memory\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "allocatable", + "refId": "A" + }, + { + "expr": "sum(kube_node_status_capacity{resource=\"memory\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "capacity", + "refId": "B" + }, + { + "expr": "sum(kube_pod_container_resource_requests{resource=\"memory\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "requested", + "refId": "C" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cluster Mem Capacity", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "fill": 1, + "gridPos": { + "h": 6, + "w": 6, + "x": 12, + "y": 11 + }, + "id": 21, 
+ "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(node_filesystem_size_bytes{nc_region=~\"$region\"}) - sum(node_filesystem_free_bytes{nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "usage", + "refId": "A" + }, + { + "expr": "sum(node_filesystem_size_bytes{nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "limit", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cluster Disk Capacity", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "fill": 1, + "gridPos": { + "h": 6, + "w": 6, + "x": 18, + "y": 11 + }, + "id": 15, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + 
"stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(kube_node_status_allocatable{resource=\"pods\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "allocatable", + "refId": "A" + }, + { + "expr": "sum(kube_node_status_capacity{resource=\"pods\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "capacity", + "refId": "B" + }, + { + "expr": "sum(kube_pod_info)", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "requested", + "refId": "C" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cluster Pod Capacity", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "pods", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 17 + }, + "id": 37, + "panels": [], + "title": "Nodes", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 8, + "x": 0, + "y": 18 + }, + "id": 35, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + 
"postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_node_info)", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Number Of Nodes", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 8, + "x": 8, + "y": 18 + }, + "id": 39, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_node_status_condition{nnc_region=~\"$region\", condition=\"OutOfDisk\", status=\"true\"})", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1", + "title": "Nodes Out of Disk", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": 
"null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 8, + "x": 16, + "y": 18 + }, + "id": 41, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_node_spec_unschedulable{nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1", + "title": "Nodes Unavailable", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 21 + }, + "id": 25, + "panels": [], + "title": "Pods", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 5, + "x": 0, + "y": 22 + }, + "id": 23, + "interval": null, + 
"links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(78, 203, 42, 0.28)", + "full": false, + "lineColor": "#629e51", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_pod_status_phase{nc_region=~\"$region\", phase=\"Running\"})", + "format": "time_series", + "interval": "", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Pods Running", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 5, + "x": 5, + "y": 22 + }, + "id": 27, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(78, 203, 42, 0.28)", + "full": false, + "lineColor": "#629e51", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": 
"sum(kube_pod_status_phase{nc_region=~\"$region\", phase=\"Pending\"})", + "format": "time_series", + "interval": "", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Pods Pending", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 5, + "x": 10, + "y": 22 + }, + "id": 29, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(78, 203, 42, 0.28)", + "full": false, + "lineColor": "#629e51", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_pod_status_phase{nc_region=~\"$region\", phase=\"Failed\"})", + "format": "time_series", + "interval": "", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Pods Failed", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 
0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 5, + "x": 15, + "y": 22 + }, + "id": 31, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(78, 203, 42, 0.28)", + "full": false, + "lineColor": "#629e51", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_pod_status_phase{nc_region=~\"$region\", phase=\"Succeeded\"})", + "format": "time_series", + "interval": "", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Pods Succeeded", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 4, + "x": 20, + "y": 22 + }, + "id": 33, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + 
"fillColor": "rgba(78, 203, 42, 0.28)", + "full": false, + "lineColor": "#629e51", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_pod_status_phase{nc_region=~\"$region\", phase=\"Unknown\"})", + "format": "time_series", + "interval": "", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Pods Unknown", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 27 + }, + "id": 45, + "panels": [], + "title": "Containers", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 0, + "y": 28 + }, + "id": 43, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_pod_container_status_running{nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Containers Running", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", 
+ "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 6, + "y": 28 + }, + "id": 47, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_pod_container_status_waiting{nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Containers Waiting", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 12, + "y": 28 + }, + "id": 49, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 
+ } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_pod_container_status_terminated{nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Containers Terminated", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 18, + "y": 28 + }, + "id": 51, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(delta(kube_pod_container_status_restarts_total{namespace!=\"kube-system\", nc_region=~\"$region\"}[30m]))", + "format": "time_series", + "intervalFactor": 1, + 
"legendFormat": "", + "refId": "A" + } + ], + "thresholds": "", + "title": "Containers Restarts (Last 30 Minutes)", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 12, + "x": 0, + "y": 32 + }, + "id": 53, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_pod_container_resource_requests{resource=\"cpu\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "CPU Cores Requested by Containers", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "decbytes", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + 
"thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 12, + "x": 12, + "y": 32 + }, + "id": 55, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_pod_container_resource_requests{resource=\"memory\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Memory Requested By Containers", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 36 + }, + "id": 59, + "panels": [], + "title": "Jobs", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 8, + "x": 0, + "y": 37 + }, + "id": 57, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + 
"prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_job_status_succeeded{nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Jobs Succeeded", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 8, + "x": 8, + "y": 37 + }, + "id": 61, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_job_status_active{nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Jobs Active", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + 
"cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "prometheus", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 8, + "x": 16, + "y": 37 + }, + "id": 63, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(kube_job_status_failed{nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Jobs Failed", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + } + ], + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": ".+", + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": 
"label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Kubernetes Cluster Status", + "uid": "kubernetes-cluster-status", + "version": 3 + } + nginx_stats: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "5.0.0" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "table", + "name": "Table", + "version": "5.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + }, + { + "datasource": "${DS_PROMETHEUS}", + "enable": true, + "expr": "sum(changes(nginx_ingress_controller_config_last_reload_successful_timestamp_seconds{instance!=\"unknown\",controller_class=~\"$controller_class\",service_namespace=~\"$namespace\",nc_region=~\"$region\"}[30s])) by (controller_class)", + "hide": false, + "iconColor": "rgba(255, 96, 96, 1)", + "limit": 100, + "name": "Config Reloads", + "showIn": 0, + "step": "30s", + "tagKeys": "controller_class", + "tags": [], + 
"titleFormat": "Config Reloaded", + "type": "tags" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 191, + "links": [], + "panels": [ + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "ops", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "id": 20, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "round(sum(irate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",service_namespace=~\"$namespace\",nc_region=~\"$region\"}[2m])), 0.001)", + "format": "time_series", + "intervalFactor": 1, + "refId": "A", + "step": 4 + } + ], + "thresholds": "", + "title": "Controller Request Volume", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + 
"thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 6, + "x": 6, + "y": 0 + }, + "id": 82, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(avg_over_time(nginx_ingress_controller_nginx_process_connections{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"}[2m]))", + "format": "time_series", + "instant": false, + "intervalFactor": 1, + "refId": "A", + "step": 4 + } + ], + "thresholds": "", + "title": "Controller Connections", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "percentunit", + "gauge": { + "maxValue": 100, + "minValue": 80, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": false + }, + "gridPos": { + "h": 3, + "w": 6, + "x": 12, + "y": 0 + }, + "id": 21, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + 
"postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(rate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",service_namespace=~\"$namespace\",status!~\"[4-5].*\",nc_region=~\"$region\"}[2m])) / sum(rate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",service_namespace=~\"$namespace\",nc_region=~\"$region\"}[2m]))", + "format": "time_series", + "intervalFactor": 1, + "refId": "A", + "step": 4 + } + ], + "thresholds": "95, 99, 99.5", + "title": "Controller Success Rate (non-4|5xx responses)", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 3, + "x": 18, + "y": 0 + }, + "id": 81, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 
118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "avg(nginx_ingress_controller_success{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"})", + "format": "time_series", + "instant": true, + "intervalFactor": 1, + "refId": "A", + "step": 4 + } + ], + "thresholds": "", + "title": "Config Reloads", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 3, + "x": 21, + "y": 0 + }, + "id": 83, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "count(nginx_ingress_controller_config_last_reload_successful{controller_pod=~\"$controller\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"} == 0)", + "format": "time_series", + "instant": true, + "intervalFactor": 1, + "refId": "A", + "step": 4 + } + ], + "thresholds": "", + "title": 
"Last Config Failed", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 3 + }, + "height": "200px", + "id": 86, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "hideEmpty": false, + "hideZero": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 300, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "repeat": null, + "repeatDirection": "h", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "round(sum(irate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (ingress), 0.001)", + "format": "time_series", + "hide": false, + "instant": false, + "interval": "", + "intervalFactor": 1, + "legendFormat": "{{ ingress }}", + "metric": "network", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Ingress Request Volume", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + 
"show": true + }, + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "max - istio-proxy": "#890f02", + "max - master": "#bf1b00", + "max - prometheus": "#bf1b00" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": false, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 3 + }, + "id": 87, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "hideEmpty": true, + "hideZero": false, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "sideWidth": 300, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",service_namespace=~\"$namespace\",ingress=~\"$ingress\",status!~\"[4-5].*\",nc_region=~\"$region\"}[2m])) by (ingress) / sum(rate(nginx_ingress_controller_requests{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",service_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (ingress)", + "format": "time_series", + "instant": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "{{ ingress }}", + "metric": "container_memory_usage:sort_desc", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Ingress Success Rate (non-4|5xx responses)", + "tooltip": { + "msResolution": 
false, + "shared": true, + "sort": 1, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "percentunit", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 6, + "w": 8, + "x": 0, + "y": 10 + }, + "height": "200px", + "id": 32, + "isNew": true, + "legend": { + "alignAsTable": false, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": false, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum (irate (nginx_ingress_controller_request_size_sum{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"}[2m]))", + "format": "time_series", + "instant": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "Received", + "metric": "network", + "refId": "A", + "step": 10 + }, + { + "expr": "- sum (irate (nginx_ingress_controller_response_size_sum{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"}[2m]))", + "format": "time_series", + "hide": false, + "interval": "10s", 
+ "intervalFactor": 1, + "legendFormat": "Sent", + "metric": "network", + "refId": "B", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Network I/O pressure", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "max - istio-proxy": "#890f02", + "max - master": "#bf1b00", + "max - prometheus": "#bf1b00" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": false, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 6, + "w": 8, + "x": 8, + "y": 10 + }, + "id": 77, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": false, + "sideWidth": 200, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "avg(nginx_ingress_controller_nginx_process_resident_memory_bytes{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"}) ", + "format": "time_series", + "instant": false, + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "nginx", + 
"metric": "container_memory_usage:sort_desc", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Average Memory Usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "max - istio-proxy": "#890f02", + "max - master": "#bf1b00" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 3, + "editable": false, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 6, + "w": 8, + "x": 16, + "y": 10 + }, + "height": "", + "id": 79, + "isNew": true, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": false, + "sort": null, + "sortDesc": null, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum (rate (nginx_ingress_controller_nginx_process_cpu_seconds_total{controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",nc_region=~\"$region\"}[2m])) ", + "format": "time_series", + "interval": "10s", + "intervalFactor": 1, + "legendFormat": "nginx", + "metric": "container_cpu", + "refId": "A", + "step": 10 + } + ], + 
"thresholds": [ + { + "colorMode": "critical", + "fill": true, + "line": true, + "op": "gt" + } + ], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Average CPU Usage", + "tooltip": { + "msResolution": true, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "cores", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "columns": [], + "datasource": "${DS_PROMETHEUS}", + "fontSize": "100%", + "gridPos": { + "h": 8, + "w": 24, + "x": 0, + "y": 16 + }, + "hideTimeOverride": false, + "id": 75, + "links": [], + "options": {}, + "pageSize": 7, + "repeat": null, + "repeatDirection": "h", + "scroll": true, + "showHeader": true, + "sort": { + "col": 1, + "desc": true + }, + "styles": [ + { + "alias": "Ingress", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "ingress", + "preserveFormat": false, + "sanitize": false, + "thresholds": [], + "type": "string", + "unit": "short" + }, + { + "alias": "Requests", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "Value #A", + "thresholds": [ + "" + ], + "type": "number", + "unit": "ops" + }, + { + "alias": "Errors", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "Value #B", + "thresholds": [], + "type": 
"number", + "unit": "ops" + }, + { + "alias": "P50 Latency", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 0, + "link": false, + "pattern": "Value #C", + "thresholds": [], + "type": "number", + "unit": "dtdurations" + }, + { + "alias": "P90 Latency", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 0, + "pattern": "Value #D", + "thresholds": [], + "type": "number", + "unit": "dtdurations" + }, + { + "alias": "P99 Latency", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 0, + "pattern": "Value #E", + "thresholds": [], + "type": "number", + "unit": "dtdurations" + }, + { + "alias": "IN", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "Value #F", + "thresholds": [ + "" + ], + "type": "number", + "unit": "Bps" + }, + { + "alias": "", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "pattern": "Time", + "thresholds": [], + "type": "hidden", + "unit": "short" + }, + { + "alias": "OUT", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "mappingType": 1, + "pattern": "Value #G", + "thresholds": [], + "type": "number", + "unit": "Bps" + } + ], + "targets": [ + { + "expr": "histogram_quantile(0.50, 
sum(rate(nginx_ingress_controller_request_duration_seconds_bucket{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (le, ingress))", + "format": "table", + "hide": false, + "instant": true, + "intervalFactor": 1, + "legendFormat": "{{ ingress }}", + "refId": "C" + }, + { + "expr": "histogram_quantile(0.90, sum(rate(nginx_ingress_controller_request_duration_seconds_bucket{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (le, ingress))", + "format": "table", + "hide": false, + "instant": true, + "intervalFactor": 1, + "legendFormat": "{{ ingress }}", + "refId": "D" + }, + { + "expr": "histogram_quantile(0.99, sum(rate(nginx_ingress_controller_request_duration_seconds_bucket{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (le, ingress))", + "format": "table", + "hide": false, + "instant": true, + "intervalFactor": 1, + "legendFormat": "{{ destination_service }}", + "refId": "E" + }, + { + "expr": "sum(irate(nginx_ingress_controller_request_size_sum{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (ingress)", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "intervalFactor": 1, + "legendFormat": "{{ ingress }}", + "refId": "F" + }, + { + "expr": "sum(irate(nginx_ingress_controller_response_size_sum{ingress!=\"\",controller_pod=~\"$controller\",controller_class=~\"$controller_class\",controller_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}[2m])) by (ingress)", + "format": "table", + "instant": true, + 
"intervalFactor": 1, + "legendFormat": "{{ ingress }}", + "refId": "G" + } + ], + "timeFrom": null, + "title": "Ingress Percentile Response Times and Transfer Rates", + "transform": "table", + "type": "table" + }, + { + "columns": [ + { + "text": "Current", + "value": "current" + } + ], + "datasource": "${DS_PROMETHEUS}", + "fontSize": "100%", + "gridPos": { + "h": 8, + "w": 24, + "x": 0, + "y": 24 + }, + "height": "1024", + "id": 85, + "links": [], + "options": {}, + "pageSize": 7, + "scroll": true, + "showHeader": true, + "sort": { + "col": 1, + "desc": false + }, + "styles": [ + { + "alias": "Time", + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "pattern": "Time", + "type": "date" + }, + { + "alias": "TTL", + "colorMode": "cell", + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 0, + "pattern": "Current", + "thresholds": [ + "0", + "691200" + ], + "type": "number", + "unit": "s" + }, + { + "alias": "", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "decimals": 2, + "pattern": "/.*/", + "thresholds": [], + "type": "number", + "unit": "short" + } + ], + "targets": [ + { + "expr": "avg(nginx_ingress_controller_ssl_expire_time_seconds{pod=~\"$controller\",service_namespace=~\"$namespace\",ingress=~\"$ingress\",nc_region=~\"$region\"}) by (host) - time()", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{ host }}", + "metric": "gke_letsencrypt_cert_expiration", + "refId": "A", + "step": 1 + } + ], + "title": "Ingress Certificate Expiry", + "transform": "timeseries_aggregations", + "type": "table" + } + ], + "refresh": "5s", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "nginx" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + 
"multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": ".*", + "current": { + "text": "All", + "value": "$__all" + }, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nginx_ingress_controller_config_hash{nc_region=~\"$region\"}, controller_namespace)", + "hide": 0, + "includeAll": true, + "label": "Namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(nginx_ingress_controller_config_hash{nc_region=~\"$region\"}, controller_namespace)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": ".*", + "current": { + "text": "All", + "value": "$__all" + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": true, + "label": "Controller Class", + "multi": false, + "name": "controller_class", + "options": [], + "query": "label_values(nginx_ingress_controller_config_hash{service_namespace=~\"$namespace\",nc_region=~\"$region\"}, controller_class) ", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": ".*", + "current": { + "text": "All", + "value": "$__all" + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": true, + "label": 
"Controller", + "multi": false, + "name": "controller", + "options": [], + "query": "label_values(nginx_ingress_controller_config_hash{service_namespace=~\"$namespace\",controller_class=~\"$controller_class\",nc_region=~\"$region\"}, controller_pod) ", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": ".*", + "current": { + "text": "All", + "value": "$__all" + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "label_values(nginx_ingress_controller_requests{service_namespace=~\"$namespace\",controller_class=~\"$controller_class\",controller=~\"$controller\",nc_region=~\"$region\"}, ingress) ", + "hide": 0, + "includeAll": true, + "label": "Ingress", + "multi": false, + "name": "ingress", + "options": [], + "query": "label_values(nginx_ingress_controller_requests{service_namespace=~\"$namespace\",controller_class=~\"$controller_class\",controller=~\"$controller\",nc_region=~\"$region\"}, ingress) ", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 2, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "2m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "NGINX Ingress controller", + "uid": "nginx", + "version": 3 + } + persistent-volume: |- + { + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 119, + "links": [], + "panels": [ + { + 
"aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "fill": 1, + "gridPos": { + "h": 9, + "w": 18, + "x": 0, + "y": 0 + }, + "id": 2, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": true, + "min": true, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "(sum without(instance, node) (kubelet_volume_stats_capacity_bytes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"}) - sum without(instance, node) (kubelet_volume_stats_available_bytes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"}))", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Used Space ", + "refId": "A" + }, + { + "expr": "sum without(instance, node) (kubelet_volume_stats_available_bytes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Free Space", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Volume Space Usage", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + 
"align": false, + "alignLevel": null + } + }, + { + "datasource": "prometheus", + "gridPos": { + "h": 9, + "w": 6, + "x": 18, + "y": 0 + }, + "id": 5, + "links": [], + "options": { + "fieldOptions": { + "calcs": [ + "mean" + ], + "defaults": { + "max": 100, + "min": 0, + "unit": "percent" + }, + "mappings": [ + { + "from": "", + "id": 1, + "operator": "", + "text": "", + "to": "", + "type": 1, + "value": "" + } + ], + "override": {}, + "thresholds": [ + { + "color": "green", + "index": 0, + "value": null + }, + { + "color": "red", + "index": 1, + "value": 80 + } + ], + "values": false + }, + "orientation": "auto", + "showThresholdLabels": true, + "showThresholdMarkers": true + }, + "pluginVersion": "6.2.0", + "targets": [ + { + "expr": "(kubelet_volume_stats_capacity_bytes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"} - kubelet_volume_stats_available_bytes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"}) / kubelet_volume_stats_capacity_bytes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"} * 100", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A" + } + ], + "timeFrom": null, + "timeShift": null, + "title": "Volume Space Usage", + "type": "gauge" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "fill": 1, + "gridPos": { + "h": 9, + "w": 18, + "x": 0, + "y": 9 + }, + "id": 3, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": true, + "min": true, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": 
false, + "targets": [ + { + "expr": "sum without(instance, node) (kubelet_volume_stats_inodes_used{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Used Space ", + "refId": "A" + }, + { + "expr": "(\n sum without(instance, node) (kubelet_volume_stats_inodes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"})\n -\n sum without(instance, node) (kubelet_volume_stats_inodes_used{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"})\n)", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{nc_region}} Free Space", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Volume inode Usage", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "datasource": "prometheus", + "gridPos": { + "h": 9, + "w": 6, + "x": 18, + "y": 9 + }, + "id": 6, + "links": [], + "options": { + "fieldOptions": { + "calcs": [ + "mean" + ], + "defaults": { + "max": 100, + "min": 0, + "unit": "percent" + }, + "mappings": [ + { + "from": "", + "id": 1, + "operator": "", + "text": "", + "to": "", + "type": 1, + "value": "" + } + ], + "override": {}, + "thresholds": [ + { + "color": "green", + "index": 0, + "value": null + }, + { + "color": "red", + "index": 1, + "value": 80 + } + ], + "values": false + }, + "orientation": "auto", + 
"showThresholdLabels": true, + "showThresholdMarkers": true + }, + "pluginVersion": "6.2.0", + "targets": [ + { + "expr": "kubelet_volume_stats_inodes_used{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"} / kubelet_volume_stats_inodes{job=\"kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\", nc_region=\"$region\"} * 100", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A" + } + ], + "timeFrom": null, + "timeShift": null, + "title": "Volume inode Usage", + "type": "gauge" + } + ], + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(kubelet_volume_stats_capacity_bytes{ job=\"kubelet\", nc_region=\"$region\"}, namespace)", + "hide": 0, + "includeAll": false, + "label": "Namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(kubelet_volume_stats_capacity_bytes{ job=\"kubelet\", nc_region=\"$region\"}, namespace)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + 
"useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(kubelet_volume_stats_capacity_bytes{ job=\"kubelet\", namespace=\"$namespace\"}, persistentvolumeclaim)", + "hide": 0, + "includeAll": false, + "label": "PersistentVolumeClaim", + "multi": false, + "name": "volume", + "options": [], + "query": "label_values(kubelet_volume_stats_capacity_bytes{ job=\"kubelet\", namespace=\"$namespace\"}, persistentvolumeclaim)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Kubernetes Persistent Volume", + "uid": "persistent-volume", + "version": 1 + } + elasticsearch: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Elasticsearch detailed dashboard", + "editable": false, + "overwrite": true, + "gnetId": 4358, + 
"graphTooltip": 1, + "id": 206, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 50, + "panels": [], + "repeat": null, + "title": "Cluster", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "#FADE2A", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 10, + "x": 0, + "y": 1 + }, + "height": "50", + "id": 8, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "(sum(elasticsearch_cluster_health_status{cluster=~\"$region\",color=\"green\",nc_region=~\"$region\"})*2)+sum(elasticsearch_cluster_health_status{cluster=~\"$region\",color=\"yellow\",nc_region=~\"$region\"})", + "format": "time_series", + "interval": "", + "intervalFactor": 3, + "legendFormat": "", + "metric": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "0,2", + "title": "Cluster health status", + "type": "singlestat", + "valueFontSize": "110%", + "valueMaps": [ + { + "op": "=", + "text": "GREEN", + "value": "2" + }, + { + "op": "=", + "text": "YELLOW", + "value": "1" + }, + { + "op": "=", + "text": "RED", + "value": "0" + } + ], + "valueName": 
"current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 10, + "y": 1 + }, + "height": "50", + "id": 10, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(elasticsearch_cluster_health_number_of_nodes{cluster=~\"$region\",nc_region=~\"$region\"})", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "metric": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "Nodes", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, 
+ "w": 4, + "x": 14, + "y": 1 + }, + "height": "50", + "id": 9, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_number_of_data_nodes{cluster=\"$region\",nc_region=~\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "metric": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "Data nodes", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 6, + "x": 18, + "y": 1 + }, + "height": "50", + "hideTimeOverride": true, + "id": 16, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + 
"prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_number_of_pending_tasks{cluster=\"$region\",nc_region=~\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "metric": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "Pending tasks", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 4 + }, + "id": 51, + "panels": [], + "repeat": null, + "title": "Shards", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 0, + "y": 5 + }, + "height": "50", + "id": 11, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "maxPerRow": 6, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "repeat": "shard_type", + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", 
+ "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_active_primary_shards{cluster=\"$region\",nc_region=~\"$region\"}", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "active primary shards", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 4, + "y": 5 + }, + "height": "50", + "id": 39, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "maxPerRow": 6, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_active_shards{cluster=\"$region\",nc_region=~\"$region\"}", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "active shards", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": 
null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 8, + "y": 5 + }, + "height": "50", + "id": 40, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "maxPerRow": 6, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_initializing_shards{cluster=\"$region\",nc_region=~\"$region\"}", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "initializing shards", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 12, + "y": 5 + }, + "height": "50", + "id": 41, + 
"interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "maxPerRow": 6, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_relocating_shards{cluster=\"$region\",nc_region=~\"$region\"}", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "relocating shards", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 3, + "w": 4, + "x": 16, + "y": 5 + }, + "height": "50", + "id": 42, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "maxPerRow": 6, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + 
"fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "elasticsearch_cluster_health_unassigned_shards{cluster=\"$region\",nc_region=~\"$region\"}", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 40 + } + ], + "thresholds": "", + "title": "unassigned shards", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 8 + }, + "id": 52, + "panels": [], + "repeat": null, + "title": "System", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 0, + "y": 9 + }, + "height": "400", + "id": 30, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_os_cpu_percent{cluster=\"$region\",es_master_node=\"true\",name=~\"$node\",nc_region=~\"$region\"}", + "format": "time_series", + "instant": false, + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }} - master", + "metric": "", + "refId": "A", + "step": 10 + }, + { + "expr": "elasticsearch_os_cpu_percent{cluster=\"$region\",es_data_node=\"true\",name=~\"$node\",nc_region=~\"$region\"}", + "format": "time_series", + 
"interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }} - data", + "metric": "", + "refId": "B", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "CPU usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "percent", + "label": "CPU usage", + "logBase": 1, + "max": 100, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 6, + "y": 9 + }, + "height": "400", + "id": 31, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_jvm_memory_used_bytes{cluster=\"$region\",name=~\"$node\",name=~\"$node\",nc_region=~\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }} - used: {{area}}", + "metric": "", + "refId": "A", + "step": 10 + }, + { + "expr": "elasticsearch_jvm_memory_committed_bytes{cluster=\"$region\",name=~\"$node\",name=~\"$node\",nc_region=~\"$region\"}", + 
"format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - committed: {{area}}", + "refId": "B", + "step": 10 + }, + { + "expr": "elasticsearch_jvm_memory_max_bytes{cluster=\"$region\",name=~\"$node\",name=~\"$node\",nc_region=~\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - max: {{area}}", + "refId": "C", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "JVM memory usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": "Memory", + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 12, + "y": 9 + }, + "height": "400", + "id": 32, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": 
"1-(elasticsearch_filesystem_data_available_bytes{cluster=\"$region\",nc_region=~\"$region\"}/elasticsearch_filesystem_data_size_bytes{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"})", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }} - {{path}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [ + { + "colorMode": "custom", + "fill": true, + "fillColor": "rgba(216, 200, 27, 0.27)", + "op": "gt", + "value": 0.8 + }, + { + "colorMode": "custom", + "fill": true, + "fillColor": "rgba(234, 112, 112, 0.22)", + "op": "gt", + "value": 0.9 + } + ], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Disk usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "percentunit", + "label": "Disk Usage %", + "logBase": 1, + "max": 1, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 18, + "y": 9 + }, + "height": "400", + "id": 47, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "sort": "max", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + 
"alias": "sent", + "transform": "negative-Y" + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "irate(elasticsearch_transport_tx_size_bytes_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} -sent", + "refId": "D", + "step": 10 + }, + { + "expr": "irate(elasticsearch_transport_rx_size_bytes_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} -received", + "refId": "C", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Network usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": "Bytes/sec", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "pps", + "label": "", + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 19 + }, + "id": 53, + "panels": [], + "repeat": null, + "title": "Documents", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 0, + "y": 20 + }, + "height": "400", + "id": 1, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 
1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_indices_docs{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Documents count", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "Documents", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 6, + "y": 20 + }, + "height": "400", + "id": 24, + "interval": "", + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": 
"rate(elasticsearch_indices_indexing_index_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Documents indexed rate", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "index calls/s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 12, + "y": 20 + }, + "height": "400", + "id": 25, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_docs_deleted{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + 
"thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Documents deleted rate", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "Documents/s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 18, + "y": 20 + }, + "height": "400", + "id": 26, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_merges_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Documents merged rate", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": 
"time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "Documents/s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 30 + }, + "id": 54, + "panels": [], + "repeat": null, + "title": "Total Operations stats", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 12, + "x": 0, + "y": 31 + }, + "height": "400", + "id": 48, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "irate(elasticsearch_indices_indexing_index_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }} - indexing", + "metric": "", + "refId": "A", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_search_query_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - query", + "refId": "B", + "step": 4 + }, + { + "expr": 
"irate(elasticsearch_indices_search_fetch_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - fetch", + "refId": "C", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_merges_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - merges", + "refId": "D", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_refresh_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - refresh", + "refId": "E", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_flush_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - flush", + "refId": "F", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Total Operations rate", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "Operations/s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 12, + "x": 12, + "y": 31 + }, + "height": "400", + "id": 49, + "legend": { + "alignAsTable": true, + "avg": true, + 
"current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "irate(elasticsearch_indices_indexing_index_time_seconds_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{ name }} - indexing", + "metric": "", + "refId": "A", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_search_query_time_ms_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - query", + "refId": "B", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_search_fetch_time_ms_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - fetch", + "refId": "C", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_merges_total_time_ms_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - merges", + "refId": "D", + "step": 4 + }, + { + "expr": "irate(elasticsearch_indices_refresh_total_time_ms_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - refresh", + "refId": "E", + "step": 4 + }, + { + "expr": 
"irate(elasticsearch_indices_flush_time_ms_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ name }} - flush", + "refId": "F", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Total Operations time", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "ms", + "label": "Time", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 41 + }, + "id": 55, + "panels": [], + "repeat": null, + "title": "Times", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 8, + "x": 0, + "y": 42 + }, + "height": "400", + "id": 33, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_search_query_time_seconds{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval]) ", + "format": 
"time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Query time", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "ms", + "label": "Time", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 8, + "x": 8, + "y": 42 + }, + "height": "400", + "id": 5, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_indexing_index_time_seconds_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Indexing time", + "tooltip": { + "msResolution": false, 
+ "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "ms", + "label": "Time", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 8, + "x": 16, + "y": 42 + }, + "height": "400", + "id": 3, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_merges_total_time_seconds_total{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Merging time", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": "Time", + "logBase": 1, + "max": null, + "min": null, + 
"show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 52 + }, + "id": 56, + "panels": [], + "repeat": null, + "title": "Caches", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 0, + "y": 53 + }, + "height": "400", + "id": 4, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_indices_fielddata_memory_size_bytes{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Field data memory size", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": "Memory", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": 
false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 6, + "y": 53 + }, + "height": "400", + "id": 34, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_fielddata_evictions{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Field data evictions", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "Evictions/s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 
10, + "w": 6, + "x": 12, + "y": 53 + }, + "height": "400", + "id": 35, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_indices_query_cache_memory_size_bytes{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Query cache size", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": "Size", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 6, + "x": 18, + "y": 53 + }, + "height": "400", + "id": 36, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + 
"lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_indices_query_cache_evictions{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Query cache evictions", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "Evictions/s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 63 + }, + "id": 57, + "panels": [], + "repeat": null, + "title": "Thread Pool", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 19, + "w": 6, + "x": 0, + "y": 64 + }, + "id": 45, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": true, + "min": true, + "show": true, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, 
+ "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": " irate(elasticsearch_thread_pool_rejected_count{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{name}} - {{ type }}", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Thread Pool operations rejected", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 19, + "w": 6, + "x": 6, + "y": 64 + }, + "id": 46, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": true, + "min": true, + "show": true, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_thread_pool_active_count{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{name}} - {{ type }}", + "refId": "A", + "step": 
10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Thread Pool operations queued", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 19, + "w": 6, + "x": 12, + "y": 64 + }, + "height": "", + "id": 43, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": true, + "min": true, + "show": true, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "elasticsearch_thread_pool_active_count{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{name}} - {{ type }}", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Thread Pool threads active", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + 
"yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 19, + "w": 6, + "x": 18, + "y": 64 + }, + "id": 44, + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": true, + "min": true, + "show": true, + "sort": "avg", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "irate(elasticsearch_thread_pool_completed_count{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{name}} - {{ type }}", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Thread Pool operations completed", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + 
"x": 0, + "y": 83 + }, + "id": 58, + "panels": [], + "repeat": null, + "title": "JVM Garbage Collection", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 12, + "x": 0, + "y": 84 + }, + "height": "400", + "id": 7, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_jvm_gc_collection_seconds_count{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}} - {{gc}}", + "metric": "", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "GC count", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "GCs", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + 
"fill": 1, + "grid": {}, + "gridPos": { + "h": 10, + "w": 12, + "x": 12, + "y": 84 + }, + "height": "400", + "id": 27, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "hideEmpty": false, + "hideZero": false, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(elasticsearch_jvm_gc_collection_seconds_count{cluster=\"$region\",name=~\"$node\",nc_region=~\"$region\"}[$interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}} - {{gc}}", + "metric": "", + "refId": "A", + "step": 4 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "GC time", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": "Time", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "30s", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "elasticsearch", + "App" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" 
+ }, + { + "allValue": ".+", + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": { + "text": "All", + "value": [ + "$__all" + ] + }, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(elasticsearch_process_cpu_percent{nc_region=~\"$region\"},name)", + "hide": 0, + "includeAll": true, + "label": "Node", + "multi": true, + "name": "node", + "options": [], + "query": "label_values(elasticsearch_process_cpu_percent{nc_region=~\"$region\"},name)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 1, + "tagValuesQuery": null, + "tags": [], + "tagsQuery": null, + "type": "query", + "useTags": false + }, + { + "auto": true, + "auto_count": 30, + "auto_min": "10s", + "current": { + "text": "1h", + "value": "1h" + }, + "hide": 0, + "label": "Interval", + "name": "interval", + "options": [ + { + "selected": false, + "text": "auto", + "value": "$__auto_interval_interval" + }, + { + "selected": false, + "text": "1m", + "value": "1m" + }, + { + "selected": false, + "text": "10m", + "value": "10m" + }, + { + "selected": false, + "text": "30m", + "value": "30m" + }, + { + "selected": true, + "text": "1h", + "value": "1h" + }, + { + "selected": false, + "text": "6h", + "value": "6h" + }, + { + "selected": false, + "text": "12h", + "value": "12h" + }, + { + "selected": false, + "text": "1d", + "value": "1d" + }, + { + "selected": false, + "text": "7d", + "value": "7d" + }, + { + "selected": false, + "text": "14d", + "value": "14d" + }, + { + "selected": false, + "text": "30d", + "value": "30d" + } + ], + "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d", + "refresh": 
2, + "skipUrlSync": false, + "type": "interval" + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Elasticsearch", + "uid": "elasticsearch", + "version": 8 + } + fluentd: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 182, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 29, + "panels": [], + "title": "Buffer Overview", + "type": "row" + }, + { + "columns": [], + "datasource": "${DS_PROMETHEUS}", + "fontSize": "100%", + "gridPos": { + "h": 20, + "w": 12, + "x": 0, + "y": 1 + }, + "id": 27, + "links": [], + "options": {}, + "pageSize": null, + "pluginVersion": "6.2.0", + "scroll": true, + "showHeader": true, + "sort": { + "col": 1, + "desc": false + }, + "styles": [ + { + "alias": "Time", + "colorMode": null, + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 2, + "mappingType": 1, + "pattern": "Time", + "thresholds": [], + "type": "hidden", + "unit": "short" + }, + { + "alias": "local_elasticsearch", + "colorMode": "value", + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD 
HH:mm:ss", + "decimals": 0, + "mappingType": 1, + "pattern": "Value #A", + "thresholds": [ + "50", + "90" + ], + "type": "number", + "unit": "short" + }, + { + "alias": "centralized_logging", + "colorMode": "value", + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 0, + "mappingType": 1, + "pattern": "Value #B", + "thresholds": [ + "50", + "90" + ], + "type": "number", + "unit": "short" + }, + { + "alias": "dmaap", + "colorMode": "value", + "colors": [ + "rgba(245, 54, 54, 0.9)", + "rgba(237, 129, 40, 0.89)", + "rgba(50, 172, 45, 0.97)" + ], + "dateFormat": "YYYY-MM-DD HH:mm:ss", + "decimals": 0, + "mappingType": 1, + "pattern": "Value #C", + "thresholds": [ + "50", + "90" + ], + "type": "number", + "unit": "short" + } + ], + "targets": [ + { + "expr": "sum by (node) (fluentd_output_status_buffer_available_space_ratio{plugin_id=\"local_elasticsearch_output\",node=~\"$node\",nc_region=~\"$region\"})", + "format": "table", + "instant": true, + "intervalFactor": 1, + "legendFormat": "", + "refId": "A" + }, + { + "expr": "sum by (node) (fluentd_output_status_buffer_available_space_ratio{plugin_id=\"centralized_logging_output\",node=~\"$node\",nc_region=~\"$region\"})", + "format": "table", + "hide": false, + "instant": true, + "intervalFactor": 1, + "legendFormat": "", + "refId": "B" + }, + { + "expr": "sum by (node) (fluentd_output_status_buffer_available_space_ratio{plugin_id=\"dmaap_output\",node=~\"$node\",nc_region=~\"$region\"})", + "format": "table", + "hide": false, + "instant": true, + "intervalFactor": 1, + "legendFormat": "", + "refId": "C" + } + ], + "timeFrom": null, + "timeShift": null, + "title": "Remaining Buffer Space Available (%)", + "transform": "table", + "type": "table" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 1, + "fill": 0, + "gridPos": { + "h": 
10, + "w": 12, + "x": 12, + "y": 1 + }, + "id": 23, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": false, + "rightSide": true, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum by (node) (fluentd_output_status_buffer_queue_length{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Chunks Queued for $destination", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": 0, + "format": "short", + "label": "Chunks in Buffer", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "description": "", + "fill": 0, + "gridPos": { + "h": 10, + "w": 12, + "x": 12, + "y": 11 + }, + "id": 34, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": false, + "rightSide": true, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": 
"null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum by (node) (rate(fluentd_output_status_flush_time_count{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"}[5m]))", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Time to Send a Chunk to $destination", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": 0, + "format": "ms", + "label": "Flush Time", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 0, + "gridPos": { + "h": 10, + "w": 12, + "x": 0, + "y": 21 + }, + "id": 25, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": false, + "rightSide": true, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "avg by (node) (fluentd_output_status_buffer_total_bytes{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"})", + 
"format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Queue Size for $destination", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": 2, + "format": "decbytes", + "label": "", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "description": "", + "fill": 0, + "gridPos": { + "h": 10, + "w": 12, + "x": 12, + "y": 21 + }, + "id": 36, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": false, + "rightSide": true, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum by (node) (rate(fluentd_output_status_write_count{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"}[5m]))", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Chunks Sent per Second to $destination", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + 
"buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": 2, + "format": "short", + "label": "Chunks Sent per Second", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 0, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 31 + }, + "id": 22, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": false, + "min": true, + "rightSide": true, + "show": true, + "sort": "current", + "sortDesc": false, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "avg by (node, plugin_id) (fluentd_output_status_buffer_available_space_ratio{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"})", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Remaining Buffer Space % for $destination", + "tooltip": { + "shared": true, + "sort": 1, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": 0, + "format": "short", + "label": "Remaining Buffer Space (%)", + "logBase": 1, + "max": "100", + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": 
null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 38 + }, + "id": 31, + "panels": [], + "title": "Errors and Retries", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "cacheTimeout": null, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "fill": 0, + "gridPos": { + "h": 8, + "w": 8, + "x": 0, + "y": 39 + }, + "id": 24, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": false, + "rightSide": true, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum by (node) (rate(fluentd_output_status_num_errors{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"}[2m]))", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Output Error Rate for $destination", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": 2, + "format": "short", + "label": "Errors Per Second", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "cacheTimeout": null, + 
"dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "fill": 0, + "gridPos": { + "h": 8, + "w": 8, + "x": 8, + "y": 39 + }, + "id": 35, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": false, + "rightSide": true, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum by (node) (rate(fluentd_output_status_retry_count{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"}[2m]))", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Output Retry Rate for $destination", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": 2, + "format": "short", + "label": "Retries Per Second", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "cacheTimeout": null, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "fill": 0, + "gridPos": { + "h": 8, + "w": 8, + "x": 16, + "y": 39 + }, + "id": 37, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": false, + "rightSide": true, + "show": true, + "sort": "current", + 
"sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum by (node) (rate(fluentd_output_status_slow_flush_count{plugin_id=\"[[destination]]_output\",node=~\"$node\",nc_region=~\"$region\"}[2m]))", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Slow Flushes to $destination", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": 2, + "format": "short", + "label": "Slow Flushes", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 47 + }, + "id": 15, + "panels": [], + "title": "Input / Output Statistics", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 0, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 48 + }, + "id": 12, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": false, + "rightSide": true, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 
2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum by ($aggregator) (rate(fluentd_read_count{node=~\"$node\",nc_region=~\"$region\"}[2m]))", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{$aggregator}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Message Input Rate by $aggregator on Node(s): $node", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": 1, + "format": "short", + "label": "Lines Read Per Second", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 0, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 48 + }, + "id": 13, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": false, + "rightSide": true, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum by ($aggregator) (rate([[destination]]_output_count{node=~\"$node\",nc_region=~\"$region\"}[2m]))", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{$aggregator}}", + "refId": "A" + } + ], + 
"thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Output Queuing Rate by $aggregator on Node(s): $node for $destination", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": 1, + "format": "short", + "label": "Lines Queued Per Second", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "30s", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "fluentd" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": ".+", + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": ".*", + "current": { + "text": "All", + "value": [ + "$__all" + ] + }, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(fluentd_read_count{nc_region=~\"$region\"},node)", + "hide": 0, + "includeAll": true, + "label": "Node", + "multi": true, + "name": "node", + "options": [], + "query": "label_values(fluentd_read_count{nc_region=~\"$region\"},node)", + "refresh": 1, + "regex": 
".*r[\\d]{2}[co]{1}[\\d]{3}", + "skipUrlSync": false, + "sort": 1, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": { + "text": "local_elasticsearch", + "value": "local_elasticsearch" + }, + "hide": 0, + "includeAll": false, + "label": "Output Buffer", + "multi": false, + "name": "destination", + "options": [ + { + "selected": true, + "text": "local_elasticsearch", + "value": "local_elasticsearch" + }, + { + "selected": false, + "text": "centralized_logging", + "value": "centralized_logging" + }, + { + "selected": false, + "text": "dmaap", + "value": "dmaap" + } + ], + "query": "local_elasticsearch,centralized_logging,dmaap", + "skipUrlSync": false, + "type": "custom" + }, + { + "allValue": null, + "current": { + "text": "tag", + "value": "tag" + }, + "hide": 0, + "includeAll": false, + "label": "Group I/O Rate by Label", + "multi": false, + "name": "aggregator", + "options": [ + { + "selected": false, + "text": "node", + "value": "node" + }, + { + "selected": false, + "text": "region", + "value": "region" + }, + { + "selected": false, + "text": "node_fqdn", + "value": "node_fqdn" + }, + { + "selected": true, + "text": "tag", + "value": "tag" + }, + { + "selected": false, + "text": "index_prefix", + "value": "index_prefix" + } + ], + "query": "node,region,node_fqdn,tag,index_prefix", + "skipUrlSync": false, + "type": "custom" + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Fluentd", + "uid": "fluentd", + "version": 2 + } + idrac: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": 
"Prometheus" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Dashboard to get an overview of one server", + "editable": true, + "gnetId": null, + "graphTooltip": 0, + "id": 95, + "iteration": 1644114779535, + "links": [], + "panels": [ + { + "cacheTimeout": null, + "datasource": "${DS_PROMETHEUS}", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "id": 0, + "op": "=", + "text": "N/A", + "type": 1, + "value": "null" + }, + { + "id": 1, + "op": "=", + "text": "Not Synchronized", + "type": 1, + "value": "0" + }, + { + "id": 2, + "op": "=", + "text": "OK", + "type": 1, + "value": "1" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#d44a3a", + "value": null + }, + { + "color": "rgba(237, 129, 40, 0.89)", + "value": 0 + }, + { + "color": "#299c46", + "value": 1 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 0, + "y": 0 + }, + "id": 20, + "interval": null, + "links": [], + "maxDataPoints": 100, + "options": { + "colorMode": "value", + "graphMode": "none", + "justifyMode": "auto", + "orientation": "horizontal", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "text": {}, + "textMode": "auto" + }, + "pluginVersion": "7.5.11", + "targets": [ + { + "expr": "idrac_licensestatus_ok{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A" + } + ], + "title": "iDRAC License Status for $node", + "transformations": [ + { + "id": "reduce", + "options": { + "reducers": [ + "lastNotNull" + ] + } + } + ], + "type": "stat" + }, + { + "datasource": "${DS_PROMETHEUS}", + "fieldConfig": { + "defaults": { + "color": { + 
"mode": "thresholds" + }, + "custom": { + "align": "center", + "displayMode": "color-background", + "filterable": false + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "rgb(37, 48, 34)", + "value": null + }, + { + "color": "rgb(206, 14, 36)", + "value": 0 + }, + { + "color": "#EAB839", + "value": 480 + }, + { + "color": "light-green", + "value": 840 + } + ] + } + }, + "overrides": [] + }, + "gridPos": { + "h": 8, + "w": 6, + "x": 6, + "y": 0 + }, + "id": 41, + "options": { + "showHeader": false + }, + "pluginVersion": "7.5.11", + "targets": [ + { + "expr": "idrac_sensors_tachometer{name=~\"System_Board_Fan[0-9]+\",nc_region=\"$region\",node=\"$node\"}", + "format": "table", + "interval": "", + "legendFormat": "{{name}}", + "queryType": "randomWalk", + "refId": "A" + } + ], + "title": "System fan for $node", + "transformations": [ + { + "id": "filterFieldsByName", + "options": { + "include": { + "names": [ + "name", + "Value" + ] + } + } + }, + { + "id": "groupBy", + "options": { + "fields": { + "Value": { + "aggregations": [ + "mean" + ], + "operation": "aggregate" + }, + "name": { + "aggregations": [], + "operation": "groupby" + } + } + } + } + ], + "type": "table" + }, + { + "cacheTimeout": null, + "datasource": "${DS_PROMETHEUS}", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "id": 0, + "op": "=", + "text": "N/A", + "type": 1, + "value": "null" + } + ], + "max": 60, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "rgba(50, 172, 45, 0.97)", + "value": null + }, + { + "color": "rgba(237, 129, 40, 0.89)", + "value": 43 + }, + { + "color": "rgba(245, 54, 54, 0.9)", + "value": 47 + } + ] + }, + "unit": "celsius" + }, + "overrides": [] + }, + "gridPos": { + "h": 8, + "w": 6, + "x": 12, + "y": 0 + }, + "id": 32, + "interval": null, + "links": [], + "maxDataPoints": 100, + "options": { + "orientation": "horizontal", + "reduceOptions": { + 
"calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showThresholdLabels": true, + "showThresholdMarkers": true, + "text": {} + }, + "pluginVersion": "7.5.11", + "targets": [ + { + "expr": "idrac_inlet_temp_in_celsius{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 60, + "target": "" + } + ], + "title": "Inlet temperature of $node", + "transformations": [ + { + "id": "reduce", + "options": { + "reducers": [ + "lastNotNull" + ] + } + } + ], + "type": "gauge" + }, + { + "cacheTimeout": null, + "datasource": "${DS_PROMETHEUS}", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "id": 0, + "op": "=", + "text": "N/A", + "type": 1, + "value": "null" + } + ], + "max": 100, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "rgba(50, 172, 45, 0.97)", + "value": null + }, + { + "color": "rgba(237, 129, 40, 0.89)", + "value": 75 + }, + { + "color": "rgba(245, 54, 54, 0.9)", + "value": 80 + } + ] + }, + "unit": "celsius" + }, + "overrides": [] + }, + "gridPos": { + "h": 8, + "w": 6, + "x": 18, + "y": 0 + }, + "id": 7, + "interval": null, + "links": [], + "maxDataPoints": 100, + "options": { + "orientation": "horizontal", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showThresholdLabels": true, + "showThresholdMarkers": true, + "text": {} + }, + "pluginVersion": "7.5.11", + "targets": [ + { + "expr": "idrac_exhaust_temp_in_celsius{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 60, + "target": "" + } + ], + "title": "Exhaust temperature of $node", + "transformations": [ + { + "id": "reduce", + "options": { + "reducers": [ + "lastNotNull" + ] + } + } + ], + "type": "gauge" + }, + { + "datasource": "${DS_PROMETHEUS}", + 
"fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "align": "center", + "displayMode": "auto", + "filterable": false + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "rgb(0, 0, 0)", + "value": null + } + ] + } + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 0, + "y": 4 + }, + "id": 45, + "interval": null, + "options": { + "showHeader": true + }, + "pluginVersion": "7.5.11", + "targets": [ + { + "exemplar": true, + "expr": "idrac_sensors_volts{name=~\"PS[0-9]+_Voltage_[0-9]+\",nc_region=\"$region\",node=\"$node\"}", + "format": "table", + "interval": "", + "legendFormat": "{{name}}", + "queryType": "randomWalk", + "refId": "A" + } + ], + "title": "Power supply for $node", + "transformations": [ + { + "id": "filterFieldsByName", + "options": { + "include": { + "names": [ + "name", + "health_state" + ] + } + } + }, + { + "id": "organize", + "options": { + "excludeByName": {}, + "indexByName": { + "health_state": 1, + "name": 0 + }, + "renameByName": { + "health_state": "Health Status", + "name": "Name" + } + } + }, + { + "id": "groupBy", + "options": { + "fields": { + "Health Status": { + "aggregations": [ + "last" + ], + "operation": "aggregate" + }, + "Name": { + "aggregations": [], + "operation": "groupby" + } + } + } + } + ], + "type": "table" + }, + { + "collapsed": false, + "datasource": null, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 8 + }, + "id": 38, + "panels": [], + "title": "Selected node metric", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fieldConfig": { + "defaults": { + "unit": "volt" + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "node_memory_SwapFree{instance=\"$server\",job=\"prometheus\"}" + }, + "properties": [ + { + "id": "unit", + "value": "short" + } + ] + } + ] + }, + "fill": 1, + "fillGradient": 0, + 
"gridPos": { + "h": 7, + "w": 23, + "x": 0, + "y": 9 + }, + "hiddenSeries": false, + "id": 33, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": { + "alertThreshold": true + }, + "percentage": false, + "pluginVersion": "7.5.11", + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "idrac_sensors_volts{name=~\"PS[0-9]+_Voltage_[0-9]+\",nc_region=\"$region\",node=\"$node\"}", + "format": "time_series", + "hide": false, + "interval": "", + "intervalFactor": 2, + "legendFormat": "{{name}}", + "metric": "", + "refId": "C", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Power supply for $node", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "$$hashKey": "object:1686", + "format": "volt", + "label": null, + "logBase": 1, + "max": null, + "min": "90", + "show": true + }, + { + "$$hashKey": "object:1687", + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "datasource": "${DS_PROMETHEUS}", + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "drawStyle": "line", + "fillOpacity": 13, + "gradientMode": "opacity", + "hideFrom": { + "graph": false, + "legend": false, + "tooltip": false + }, + "lineInterpolation": "linear", + "lineStyle": { + "fill": "solid" + }, + "lineWidth": 2, + "pointSize": 6, + 
"scaleDistribution": { + "type": "linear" + }, + "showPoints": "auto", + "spanNulls": false + }, + "mappings": [], + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": null + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "celsius" + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "node_memory_SwapFree{instance=\"$server\",job=\"prometheus\"}" + }, + "properties": [ + { + "id": "unit", + "value": "short" + } + ] + } + ] + }, + "gridPos": { + "h": 7, + "w": 23, + "x": 0, + "y": 16 + }, + "id": 4, + "links": [], + "options": { + "graph": {}, + "legend": { + "calcs": [], + "displayMode": "list", + "placement": "bottom" + }, + "tooltipOptions": { + "mode": "single" + } + }, + "pluginVersion": "7.4.5", + "targets": [ + { + "expr": "idrac_inlet_temp_in_celsius{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "hide": false, + "interval": "", + "intervalFactor": 2, + "legendFormat": "inlet temp", + "metric": "", + "refId": "C", + "step": 10 + }, + { + "expr": "idrac_exhaust_temp_in_celsius{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "exhaust temp", + "metric": "", + "refId": "E", + "step": 10 + } + ], + "timeFrom": null, + "timeShift": null, + "title": "Temperature for $node", + "type": "timeseries" + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fieldConfig": { + "defaults": { + "unit": "rotrpm" + }, + "overrides": [] + }, + "fill": 1, + "fillGradient": 0, + "grid": {}, + "gridPos": { + "h": 8, + "w": 23, + "x": 0, + "y": 23 + }, + "hiddenSeries": false, + "id": 3, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + 
"nullPointMode": "connected", + "options": { + "alertThreshold": true + }, + "percentage": false, + "pluginVersion": "7.5.11", + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "idrac_sensors_tachometer{nc_region=\"$region\",node=\"$node\",name=~\"System_Board_Fan[0-9]+\"}", + "format": "time_series", + "hide": false, + "interval": "", + "intervalFactor": 10, + "legendFormat": "{{name}}", + "refId": "A", + "step": 50 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Fan speed for $node", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "$$hashKey": "object:2909", + "format": "rotrpm", + "label": "Fan speed", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "$$hashKey": "object:2910", + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "datasource": null, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 31 + }, + "id": 14, + "panels": [], + "title": "All Node iDrac metrics", + "type": "row" + }, + { + "datasource": "${DS_PROMETHEUS}", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "custom": { + "align": "center", + "displayMode": "color-background", + "filterable": true + }, + "mappings": [ + { + "from": "", + "id": 1, + "text": "OK", + "to": "", + "type": 1, + "value": "1" + }, + { + "from": "", + "id": 2, + "text": "EXPIRED", + "to": "", + "type": 1, + "value": "0" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "rgb(37, 48, 34)", + "value": null + }, + { + "color": 
"semi-dark-red", + "value": 0 + }, + { + "color": "light-green", + "value": 1 + } + ] + } + }, + "overrides": [] + }, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 32 + }, + "id": 36, + "options": { + "showHeader": true, + "sortBy": [] + }, + "pluginVersion": "7.5.11", + "targets": [ + { + "exemplar": true, + "expr": "idrac_licensestatus_ok{nc_region=\"$region\"}", + "format": "table", + "instant": false, + "interval": "", + "legendFormat": "", + "queryType": "randomWalk", + "refId": "A" + } + ], + "timeFrom": "1d", + "title": "License status per Node", + "transformations": [ + { + "id": "filterFieldsByName", + "options": { + "include": { + "names": [ + "node", + "Value #A", + "name" + ] + } + } + }, + { + "id": "organize", + "options": { + "excludeByName": {}, + "indexByName": {}, + "renameByName": { + "Value #A": "Status", + "name": "License Name", + "node": "Node" + } + } + }, + { + "id": "groupBy", + "options": { + "fields": { + "License Name": { + "aggregations": [ + "last" + ], + "operation": "aggregate" + }, + "Node": { + "aggregations": [], + "operation": "groupby" + }, + "Status": { + "aggregations": [ + "last" + ], + "operation": "aggregate" + } + } + } + } + ], + "type": "table" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "$DS_PROMETHEUS", + "fieldConfig": { + "defaults": { + "unit": "celsius" + }, + "overrides": [] + }, + "fill": 1, + "fillGradient": 0, + "gridPos": { + "h": 10, + "w": 24, + "x": 0, + "y": 39 + }, + "hiddenSeries": false, + "id": 12, + "interval": "", + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "maxPerRow": 2, + "nullPointMode": "null", + "options": { + "alertThreshold": true + }, + "percentage": false, + "pluginVersion": "7.5.11", + "pointradius": 2, + "points": false, + "renderer": 
"flot", + "repeat": null, + "repeatDirection": "h", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "idrac_inlet_temp_in_celsius{nc_region=\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": "1w", + "timeRegions": [], + "timeShift": null, + "title": "Inlet temperature of all nodes in $region", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "$$hashKey": "object:2130", + "format": "celsius", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "$$hashKey": "object:2131", + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "$DS_PROMETHEUS", + "fieldConfig": { + "defaults": { + "unit": "celsius" + }, + "overrides": [] + }, + "fill": 1, + "fillGradient": 0, + "gridPos": { + "h": 10, + "w": 24, + "x": 0, + "y": 49 + }, + "hiddenSeries": false, + "id": 43, + "interval": "", + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "maxPerRow": 2, + "nullPointMode": "null", + "options": { + "alertThreshold": true + }, + "percentage": false, + "pluginVersion": "7.5.11", + "pointradius": 2, + "points": false, + "renderer": "flot", + "repeatDirection": "h", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": 
"idrac_exhaust_temp_in_celsius{nc_region=\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": "1w", + "timeRegions": [], + "timeShift": null, + "title": "Exhaust temperature of all nodes in $region", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "$$hashKey": "object:2130", + "format": "celsius", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "$$hashKey": "object:2131", + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "$DS_PROMETHEUS", + "fieldConfig": { + "defaults": { + "unit": "volt" + }, + "overrides": [] + }, + "fill": 1, + "fillGradient": 0, + "gridPos": { + "h": 10, + "w": 24, + "x": 0, + "y": 59 + }, + "hiddenSeries": false, + "id": 42, + "interval": "", + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "hideEmpty": true, + "hideZero": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "maxPerRow": 2, + "nullPointMode": "null", + "options": { + "alertThreshold": true + }, + "percentage": false, + "pluginVersion": "7.5.11", + "pointradius": 2, + "points": false, + "renderer": "flot", + "repeatDirection": "h", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "exemplar": true, + "expr": "idrac_sensors_volts{name=~\"PS[0-9]+_Voltage_[0-9]+\",nc_region=\"$region\"}", + "format": "time_series", + "interval": "", + 
"intervalFactor": 1, + "legendFormat": "{{node}} {{name}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": "1w", + "timeRegions": [], + "timeShift": null, + "title": "Power supply of all nodes in $region", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "$$hashKey": "object:2130", + "format": "volt", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "$$hashKey": "object:2131", + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "$DS_PROMETHEUS", + "fieldConfig": { + "defaults": { + "unit": "rotrpm" + }, + "overrides": [] + }, + "fill": 1, + "fillGradient": 0, + "gridPos": { + "h": 10, + "w": 24, + "x": 0, + "y": 69 + }, + "hiddenSeries": false, + "id": 44, + "interval": "", + "legend": { + "alignAsTable": true, + "avg": true, + "current": false, + "hideEmpty": true, + "hideZero": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "maxPerRow": 2, + "nullPointMode": "null", + "options": { + "alertThreshold": true + }, + "percentage": false, + "pluginVersion": "7.5.11", + "pointradius": 2, + "points": false, + "renderer": "flot", + "repeatDirection": "h", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "exemplar": true, + "expr": "idrac_sensors_tachometer{nc_region=\"$region\",name=~\"System_Board_Fan[0-9]+\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 1, + "legendFormat": "{{node}} {{name}}", + "refId": "A" + } + ], + "thresholds": [], + 
"timeFrom": "1w", + "timeRegions": [], + "timeShift": null, + "title": "Fan speed of all nodes in $region", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "$$hashKey": "object:2130", + "format": "rotrpm", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "$$hashKey": "object:2131", + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": false, + "schemaVersion": 27, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "selected": false, + "text": "prometheus", + "value": "prometheus" + }, + "description": null, + "error": null, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "queryValue": "", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "description": null, + "error": null, + "hide": 0, + "includeAll": false, + "label": "Region", + "multi": false, + "name": "region", + "options": [], + "query": { + "query": "label_values(nc_region)", + "refId": "prometheus-region-Variable-Query" + }, + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "label_values(node_uname_info{nc_region=\"$region\"}, node)", + "description": null, + "error": null, + "hide": 0, + "includeAll": false, + "label": "Node", + "multi": false, + "name": "node", + 
"options": [], + "query": { + "query": "label_values(node_uname_info{nc_region=\"$region\"}, node)", + "refId": "prometheus-node-Variable-Query" + }, + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "IDRAC", + "uid": "7AovVvank", + "version": 1 + } + named_processes: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Process metrics exported by https://github.com/ncabatoff/process-exporter.", + "editable": false, + "gnetId": 249, + "graphTooltip": 1, + "id": 77, + "links": [ + { + "asDropdown": true, + "icon": "external link", + "includeVars": true, + "keepTime": true, + "tags": [ + "OS" + ], + "title": "OS", + "type": "dashboards" + } + ], + "panels": [ + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "editable": 
true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 0 + }, + "id": 1, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "namedprocess_namegroup_num_procs{groupname=~\"$processes\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{groupname}} - {{hostname}}", + "metric": "process_namegroup_num_procs", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "num processes", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 0 + }, + "id": 2, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + 
"pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(namedprocess_namegroup_cpu_system_seconds_total{groupname=~\"$processes\", nc_region=\"$nc_region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{groupname}} - {{hostname}}", + "metric": "process_namegroup_cpu_seconds_total", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "cpu", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 7 + }, + "id": 3, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(namedprocess_namegroup_read_bytes_total{groupname=~\"$processes\", nc_region=\"$nc_region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{groupname}} - 
{{hostname}}", + "metric": "namedprocess_namegroup_read_bytes_total", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "read bytes", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 7 + }, + "id": 4, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(namedprocess_namegroup_write_bytes_total{groupname=~\"$processes\", nc_region=\"$nc_region\"}[$interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{groupname}} - {{hostname}}", + "metric": "namedprocess_namegroup_read_bytes_total", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "write bytes", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, 
+ "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "Bps", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 14 + }, + "id": 5, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "namedprocess_namegroup_memory_bytes{groupname=~\"$processes\", memtype=\"resident\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{groupname}} - {{hostname}}", + "metric": "namedprocess_namegroup_memory_bytes", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "resident memory", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + 
"aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 14 + }, + "id": 6, + "isNew": true, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "namedprocess_namegroup_memory_bytes{groupname=~\"$processes\", memtype=\"virtual\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{groupname}} - {{hostname}}", + "metric": "namedprocess_namegroup_memory_bytes", + "refId": "A", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "virtual memory", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "1m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "OS" + ], + "templating": { + "list": [ + { + "auto": false, + "auto_count": 30, + "auto_min": "10s", + "current": { + "text": "10m", + "value": "10m" + }, + "datasource": null, + "hide": 0, + "includeAll": false, + "label": "", + "multi": false, + "name": "interval", + "options": [ + { + 
"selected": false, + "text": "1m", + "value": "1m" + }, + { + "selected": false, + "text": "5m", + "value": "5m" + }, + { + "selected": true, + "text": "10m", + "value": "10m" + }, + { + "selected": false, + "text": "30m", + "value": "30m" + }, + { + "selected": false, + "text": "1h", + "value": "1h" + }, + { + "selected": false, + "text": "6h", + "value": "6h" + }, + { + "selected": false, + "text": "12h", + "value": "12h" + }, + { + "selected": false, + "text": "1d", + "value": "1d" + }, + { + "selected": false, + "text": "7d", + "value": "7d" + }, + { + "selected": false, + "text": "14d", + "value": "14d" + }, + { + "selected": false, + "text": "30d", + "value": "30d" + } + ], + "query": "1m,5m,10m,30m,1h,6h,12h,1d,7d,14d,30d", + "refresh": 2, + "skipUrlSync": false, + "type": "interval" + }, + { + "allValue": ".+", + "current": { + "selected": false, + "tags": [], + "text": "All", + "value": [ + "$__all" + ] + }, + "datasource": "prometheus", + "definition": "label_values(groupname)", + "hide": 0, + "includeAll": true, + "label": null, + "multi": true, + "name": "processes", + "options": [], + "query": "label_values(groupname)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "prometheus", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC_Region", + "multi": false, + "name": "nc_region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 1, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", 
+ "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Named Processes", + "uid": "named-processes", + "version": 1 + } + nodes: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Dashboard to get an overview of one server", + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 128, + "links": [], + "panels": [ + { + "cacheTimeout": null, + "colorBackground": false, + "colorPrefix": true, + "colorValue": true, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 0, + "y": 0 + }, + "id": 30, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "$node =", + "prefixFontSize": "70%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": 
"null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "node_ntp_leap{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,3", + "timeFrom": null, + "timeShift": null, + "title": "Leap Second Status", + "type": "singlestat", + "valueFontSize": "70%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + }, + { + "op": "=", + "text": "OK", + "value": "0" + }, + { + "op": "=", + "text": "add leap second at UTC midnight", + "value": "1" + }, + { + "op": "=", + "text": "delete leap second at UTC midnight", + "value": "2" + }, + { + "op": "=", + "text": "unsynchronised", + "value": "3" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 4, + "y": 0 + }, + "id": 18, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "$node =", + "prefixFontSize": "70%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "sum(node_timex_pps_jitter_total{node=~\"$node\", nc_region=\"$region\"})", + "format": 
"time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Jitter Count", + "type": "singlestat", + "valueFontSize": "70%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "total" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 8, + "y": 0 + }, + "id": 31, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "$node =", + "prefixFontSize": "70%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "node_ntp_stratum{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "", + "title": "Stratum", + "type": "singlestat", + "valueFontSize": "70%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": 
true, + "thresholdMarkers": true + }, + "gridPos": { + "h": 8, + "w": 6, + "x": 12, + "y": 0 + }, + "id": 5, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "100 * (1 - (node_memory_MemFree_bytes{hostname=\"$node\", nc_region=\"$region\"} + node_memory_Buffers_bytes{hostname=\"$node\", nc_region=\"$region\"} + node_memory_Cached_bytes{hostname=\"$node\", nc_region=\"$region\"}) / (node_memory_MemTotal_bytes{hostname=\"$node\", nc_region=\"$region\"} - (node_memory_HugePages_Total{hostname=\"$node\", nc_region=\"$region\"} * node_memory_Hugepagesize_bytes{hostname=\"$node\", nc_region=\"$region\"})))", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 60, + "target": "" + } + ], + "thresholds": "80, 90", + "title": "Memory usage of $host excluding the Hugepages", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "percentunit", + "gauge": { + "maxValue": 1, + "minValue": 0, + "show": true, + "thresholdLabels": true, + "thresholdMarkers": true + }, + "gridPos": { + "h": 8, + "w": 6, + "x": 
18, + "y": 0 + }, + "id": 7, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "(sum(node_filesystem_size_bytes{device!~\"tmpfs|shm\",node=\"$node\", nc_region=\"$region\"}) - sum(node_filesystem_free_bytes{device!~\"tmpfs|shm\",node=\"$node\", nc_region=\"$region\"})) / sum(node_filesystem_size_bytes{device!~\"tmpfs|shm\",node=\"$node\", nc_region=\"$region\"})", + "format": "time_series", + "intervalFactor": 2, + "refId": "A", + "step": 60, + "target": "" + } + ], + "thresholds": "0.75, 0.90", + "title": "Disk space usage of $host", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorPrefix": true, + "colorValue": true, + "colors": [ + "#d44a3a", + "rgba(237, 129, 40, 0.89)", + "#299c46" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 0, + "y": 4 + }, + "id": 20, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + 
"postfixFontSize": "50%", + "prefix": "$node =", + "prefixFontSize": "70%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "node_timex_sync_status{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "0,1", + "title": "Clock_Synchronization", + "type": "singlestat", + "valueFontSize": "70%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + }, + { + "op": "=", + "text": "Not Synchronized", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorPostfix": false, + "colorPrefix": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 4, + "y": 4 + }, + "id": 22, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "/ms", + "postfixFontSize": "50%", + "prefix": "$node =", + "prefixFontSize": "70%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": true, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "node_ntp_sanity{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + 
"intervalFactor": 1, + "legendFormat": "", + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Sanity Check", + "type": "singlestat", + "valueFontSize": "70%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 8 + }, + "id": 16, + "panels": [], + "title": "NTP Status", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 2, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 9 + }, + "id": 24, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "node_ntp_root_delay_seconds{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Node_ntp_root_delay_seconds", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": 
"${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 9 + }, + "id": 9, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "node_load1{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 4, + "legendFormat": "load 1m", + "refId": "A", + "step": 20, + "target": "" + }, + { + "expr": "node_load5{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 4, + "legendFormat": "load 5m", + "refId": "B", + "step": 20, + "target": "" + }, + { + "expr": "node_load15{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 4, + "legendFormat": "load 15m", + "refId": "C", + "step": 20, + "target": "" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "System load", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "percentunit", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 2, + "gridPos": { + "h": 8, + "w": 12, + "x": 0, + "y": 16 + 
}, + "id": 26, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "node_timex_pps_jitter_seconds{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "node_timex_pps_jitter_seconds", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 8, + "w": 12, + "x": 12, + "y": 16 + }, + "id": 28, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "node_ntp_offset_seconds{node=\"$node\", nc_region=\"$region\"}", + "format": 
"time_series", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "node_ntp_offset_seconds", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 24 + }, + "id": 14, + "panels": [], + "title": "Node Status", + "type": "row" + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 8, + "w": 23, + "x": 0, + "y": 25 + }, + "id": 3, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "100 - (avg by (cpu) (irate(node_cpu_seconds_total{mode=\"idle\", nc_region=~\"$region\", node=\"$node\"}[1h])) * 100)", + "format": "time_series", + "hide": false, + "intervalFactor": 10, + "legendFormat": "", + "refId": "A", + "step": 50 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Idle cpu", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 
0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "percent", + "label": "cpu usage", + "logBase": 1, + "max": 100, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 23, + "x": 0, + "y": 33 + }, + "id": 4, + "legend": { + "alignAsTable": false, + "avg": false, + "current": false, + "hideEmpty": false, + "hideZero": false, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "node_memory_SwapFree{instance=\"$server\",job=\"prometheus\"}", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "node_memory_MemTotal_bytes{node=\"$node\", nc_region=\"$region\"} - node_memory_MemFree_bytes{node=\"$node\", nc_region=\"$region\"} - node_memory_Buffers_bytes{node=\"$node\", nc_region=\"$region\"} - node_memory_Cached_bytes{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "hide": false, + "interval": "", + "intervalFactor": 2, + "legendFormat": "memory used", + "metric": "", + "refId": "C", + "step": 10 + }, + { + "expr": "node_memory_Buffers_bytes{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "memory buffers", + "metric": "", + 
"refId": "E", + "step": 10 + }, + { + "expr": "node_memory_Cached_bytes{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "memory cached", + "metric": "", + "refId": "F", + "step": 10 + }, + { + "expr": "node_memory_MemFree_bytes{node=\"$node\", nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "memory free", + "metric": "", + "refId": "D", + "step": 10 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Memory usage", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 23, + "x": 0, + "y": 40 + }, + "id": 6, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "read", + "yaxis": 1 + }, + { + "alias": "{instance=\"$server\"}", + "yaxis": 2 + }, + { + "alias": "io time", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum by (instance) 
(rate(node_disk_read_bytes_total{node=\"$node\", nc_region=\"$region\"}[1h]))", + "format": "time_series", + "hide": false, + "intervalFactor": 4, + "legendFormat": "read", + "refId": "A", + "step": 20, + "target": "" + }, + { + "expr": "sum by (instance) (rate(node_disk_written_bytes_total{node=\"$node\", nc_region=\"$region\"}[1h]))", + "format": "time_series", + "intervalFactor": 4, + "legendFormat": "written", + "refId": "B", + "step": 20 + }, + { + "expr": "sum by (instance) (rate(node_disk_io_time_seconds_total{node=\"$node\", nc_region=\"$region\"}[1h]))", + "format": "time_series", + "intervalFactor": 4, + "legendFormat": "io time", + "refId": "C", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Disk I/O", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "ms", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 9, + "w": 23, + "x": 0, + "y": 47 + }, + "id": 8, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "transmitted ", + "yaxis": 2 + } + ], + "spaceLength": 10, 
+ "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(node_network_receive_bytes_total{node=\"$node\", nc_region=\"$region\",device!~\"lo\"}[5m])", + "format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "{{device}}", + "refId": "A", + "step": 10, + "target": "" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Network received", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "alerting": {}, + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 8, + "w": 23, + "x": 0, + "y": 56 + }, + "id": 10, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "transmitted ", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(node_network_transmit_bytes_total{node=\"$node\", nc_region=\"$region\", device!~\"lo\"}[5m])", + "format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "{{device}}", + "refId": "B", + "step": 10, + "target": "" + } + ], + "thresholds": [], + 
"timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Network transmitted", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "$DS_PROMETHEUS", + "fill": 1, + "gridPos": { + "h": 10, + "w": 24, + "x": 0, + "y": 64 + }, + "id": 12, + "interval": "", + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "rightSide": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "dbus_serial{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{node}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": "1w", + "timeRegions": [], + "timeShift": null, + "title": "systemd_dbus_serial", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + 
], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": false, + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "label_values(node_uname_info{nc_region=\"$region\"}, node)", + "hide": 0, + "includeAll": false, + "label": "Node", + "multi": false, + "name": "node", + "options": [], + "query": "label_values(node_uname_info{nc_region=\"$region\"}, node)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Nodes Status", + "uid": "nodes-status", + "version": 7 + } + prometheus: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "Prometheus which you want to monitor", + "type": "datasource", + 
"pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "" + }, + { + "type": "panel", + "id": "text", + "name": "Text", + "version": "" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + }, + { + "datasource": "${DS_PROMETHEUS}", + "enable": true, + "expr": "count(sum(up{instance=\"$instance\",nc_region=~\"$region\"}) by (instance) < 1)", + "hide": false, + "iconColor": "rgb(250, 44, 18)", + "limit": 100, + "name": "downage", + "showIn": 0, + "step": "30s", + "tagKeys": "instance", + "textFormat": "prometheus down", + "titleFormat": "Downage", + "type": "alert" + }, + { + "datasource": "${DS_PROMETHEUS}", + "enable": true, + "expr": "sum(changes(prometheus_config_last_reload_success_timestamp_seconds[10m])) by (instance)", + "hide": false, + "iconColor": "#fceaca", + "limit": 100, + "name": "Reload", + "showIn": 0, + "step": "5m", + "tagKeys": "instance", + "tags": [], + "titleFormat": "Reload", + "type": "tags" + } + ] + }, + "description": "Dashboard for monitoring of Prometheus v2.x.x", + "editable": false, + "overwrite": true, + "gnetId": 3681, + "graphTooltip": 1, + "id": 224, + "links": [ + { + "icon": "info", + "tags": [], + "targetBlank": true, + "title": "Dashboard's Github ", + "tooltip": "Github repo of this dashboard", + "type": "link", + "url": "https://github.com/FUSAKLA/Prometheus2-grafana-dashboard" + }, + { + "icon": "doc", + "tags": [], + "targetBlank": true, + "title": "Prometheus Docs", + "tooltip": "", 
+ "type": "link", + "url": "http://prometheus.io/docs/introduction/overview/" + } + ], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 53, + "panels": [], + "repeat": null, + "title": "Header instance info", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#bf1b00" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 1, + "format": "s", + "gauge": { + "maxValue": 1000000, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 41, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "time() - process_start_time_seconds{instance=\"$instance\",nc_region=~\"$region\"}", + "format": "time_series", + "instant": false, + "intervalFactor": 2, + "refId": "A" + } + ], + "thresholds": "", + "title": "Uptime", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#bf1b00" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "short", + "gauge": { + "maxValue": 1000000, + "minValue": 0, + "show": false, + 
"thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 8, + "x": 4, + "y": 1 + }, + "id": 42, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "expr": "prometheus_tsdb_head_series{instance=\"$instance\",nc_region=~\"$region\"}", + "format": "time_series", + "instant": false, + "intervalFactor": 2, + "refId": "A" + } + ], + "thresholds": "500000,800000,1000000", + "title": "Total count of time series", + "type": "singlestat", + "valueFontSize": "150%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 4, + "x": 12, + "y": 1 + }, + "id": 48, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" 
+ } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "version", + "targets": [ + { + "expr": "prometheus_build_info{instance=\"$instance\",nc_region=~\"$region\"}", + "format": "table", + "instant": true, + "intervalFactor": 2, + "refId": "A" + } + ], + "thresholds": "", + "title": "Version", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "format": "ms", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 4, + "x": 16, + "y": 1 + }, + "id": 49, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "prometheus_tsdb_head_max_time{instance=\"$instance\",nc_region=~\"$region\"} - prometheus_tsdb_head_min_time{instance=\"$instance\",nc_region=~\"$region\"}", + "format": "time_series", + "instant": true, + "intervalFactor": 2, + "refId": "A" + } + ], + "thresholds": "", + "title": "Actual head block length", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + 
"text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "content": "", + "gridPos": { + "h": 5, + "w": 2, + "x": 20, + "y": 1 + }, + "height": "", + "id": 50, + "links": [], + "mode": "html", + "options": {}, + "title": "", + "transparent": true, + "type": "text" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": true, + "colors": [ + "#e6522c", + "rgba(237, 129, 40, 0.89)", + "#299c46" + ], + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 2, + "x": 22, + "y": 1 + }, + "id": 52, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "2.12", + "format": "time_series", + "intervalFactor": 2, + "refId": "A" + } + ], + "thresholds": "10,20", + "title": "", + "transparent": true, + "type": "singlestat", + "valueFontSize": "200%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "avg" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 6 + }, + "id": 54, + "panels": [], + "repeat": null, + "title": "Main info", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + 
"h": 7, + "w": 8, + "x": 0, + "y": 7 + }, + "id": 15, + "legend": { + "avg": true, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "max(prometheus_engine_query_duration_seconds{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, slice)", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "max duration for {{slice}}", + "metric": "prometheus_local_storage_rushed_mode", + "refId": "A", + "step": 900 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Query elapsed time", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": "", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 7 + }, + "id": 17, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + 
"options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_tsdb_head_series_created_total{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "created on {{ instance }}", + "metric": "prometheus_local_storage_maintain_series_duration_seconds_count", + "refId": "A", + "step": 1800 + }, + { + "expr": "sum(prometheus_tsdb_head_series_removed_total{instance=\"$instance\",nc_region=~\"$region\"}) by (instance) * -1", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "removed on {{ instance }}", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Head series created/deleted", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 7 + }, + "id": 13, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": 
"null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum_over_time(prometheus_target_scrapes_exceeded_sample_limit_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "exceeded_sample_limit on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "A", + "step": 1800 + }, + { + "expr": "sum_over_time(prometheus_target_scrapes_sample_duplicate_timestamp_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "duplicate_timestamp on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "B", + "step": 1800 + }, + { + "expr": "sum_over_time(prometheus_target_scrapes_sample_out_of_bounds_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "out_of_bounds on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "C", + "step": 1800 + }, + { + "expr": "sum_over_time(prometheus_target_scrapes_sample_out_of_order_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "out_of_order on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "D", + "step": 1800 + }, + { + "expr": "sum_over_time(prometheus_rule_evaluation_failures_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "rule_evaluation_failure on {{ instance }}", + "metric": 
"prometheus_local_storage_chunk_ops_total", + "refId": "G", + "step": 1800 + }, + { + "expr": "sum_over_time(prometheus_tsdb_compactions_failed_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "tsdb_compactions_failed on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "K", + "step": 1800 + }, + { + "expr": "sum_over_time(prometheus_tsdb_reloads_failures_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "tsdb_reloads_failures on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "L", + "step": 1800 + }, + { + "expr": "sum_over_time(prometheus_tsdb_head_series_not_found{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "head_series_not_found on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "E", + "step": 1800 + }, + { + "expr": "sum_over_time(prometheus_evaluator_iterations_missed_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "evaluator_iterations_missed on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "O", + "step": 1800 + }, + { + "expr": "sum_over_time(prometheus_evaluator_iterations_skipped_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "evaluator_iterations_skipped on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "P", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": 
null, + "title": "Prometheus errors", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 14 + }, + "id": 55, + "panels": [], + "repeat": null, + "title": "Scrape & rule duration", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "description": "", + "editable": true, + "error": false, + "fill": 1, + "grid": {}, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 15 + }, + "id": 25, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": false, + "show": false, + "sort": "max", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "prometheus_target_interval_length_seconds{instance=\"$instance\",quantile=\"0.99\",nc_region=~\"$region\"} - 60", + "format": "time_series", + "interval": "2m", + "intervalFactor": 1, + "legendFormat": "{{instance}}", + "metric": "", + "refId": "A", + "step": 300 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Scrape delay (counts with 1m scrape interval)", + "tooltip": { + "msResolution": false, + "shared": true, + 
"sort": 2, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 15 + }, + "id": 14, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "Queue length", + "yaxis": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_rule_evaluation_duration_seconds{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, quantile)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Queue length", + "metric": "prometheus_local_storage_indexing_queue_length", + "refId": "B", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Rule evaulation duration", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": null, + "logBase": 1, + "max": 
null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 22 + }, + "id": 56, + "panels": [], + "repeat": null, + "title": "Requests & queries", + "type": "row" + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 0, + "y": 23 + }, + "id": 18, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum_over_time(prometheus_http_requests_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ handler }} on {{ instance }}", + "metric": "", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Request count", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + 
"min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 6, + "y": 23 + }, + "id": 16, + "legend": { + "avg": false, + "current": false, + "hideEmpty": true, + "hideZero": true, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "max(sum(prometheus_http_request_duration_seconds_sum{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, handler, quantile)) by (instance, handler) > 0", + "format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "{{ handler }} on {{ instance }}", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Request duration per handler", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "µs", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to 
persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 12, + "y": 23 + }, + "id": 19, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum_over_time(prometheus_http_response_size_bytes_sum{instance=\"$instance\", nc_region=~\"$region\"}[$aggregation_interval]) > 0", + "format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "{{ handler }} in {{ instance }}", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Response size by handler", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Allocated bytes": "#F9BA8F", + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max count collector": "#bf1b00", + "Max count harvester": "#bf1b00", + "Max to persist": "#3F6833", + "RSS": "#890F02" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 
1, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 23 + }, + "id": 8, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/Max.*/", + "fill": 0, + "linewidth": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_engine_queries{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, handler)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Current count ", + "metric": "last", + "refId": "A", + "step": 1800 + }, + { + "expr": "sum(prometheus_engine_queries_concurrent_max{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, handler)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Max count", + "metric": "last", + "refId": "B", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cont of concurent queries", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 30 + }, + "id": 57, + "panels": [], + "repeat": null, + "title": "Alerting", + "type": "row" + }, + { + "aliasColors": { + "Alert queue capacity on o collector": "#bf1b00", + "Alert 
queue capacity on o harvester": "#bf1b00", + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 31 + }, + "id": 20, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/.*capacity.*/", + "fill": 0, + "linewidth": 2 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_notifications_queue_capacity{instance=\"$instance\",nc_region=~\"$region\"})by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Alert queue capacity ", + "metric": "prometheus_local_storage_checkpoint_last_size_bytes", + "refId": "A", + "step": 1800 + }, + { + "expr": "sum(prometheus_notifications_queue_length{instance=\"$instance\",nc_region=~\"$region\"})by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Alert queue size on ", + "metric": "prometheus_local_storage_checkpoint_last_size_bytes", + "refId": "B", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Alert queue size", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": 
null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 31 + }, + "id": 21, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_notifications_alertmanagers_discovered{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Checkpoint chunks written/s", + "metric": "prometheus_local_storage_checkpoint_series_chunks_written_sum", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Count of discovered alertmanagers", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max 
chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 31 + }, + "id": 39, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum_over_time(prometheus_notifications_dropped_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "notifications_dropped on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "F", + "step": 1800 + }, + { + "expr": "sum_over_time(prometheus_rule_evaluation_failures_total{rule_type=\"alerting\",instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "rule_evaluation_failures on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Alerting errors", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + 
"show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 38 + }, + "id": 58, + "panels": [], + "repeat": null, + "title": "Service discovery", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 0, + "y": 39 + }, + "id": 45, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "count_over_time(prometheus_target_sync_length_seconds_count{scrape_job=\"kubernetes-service-endpoints\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Count of target synces", + "refId": "A", + "step": 240 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Kubernetes SD sync count", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": 
false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 6, + "y": 39 + }, + "id": 46, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "prometheus_target_scrapes_exceeded_sample_limit_total{instance=\"$instance\",nc_region=~\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "exceeded_sample_limit on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "A", + "step": 1800 + }, + { + "expr": "prometheus_sd_file_read_errors_total{instance=\"$instance\",nc_region=~\"$region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 2, + "legendFormat": "sd_file_read_error on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "E", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Service discovery errors", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 46 + }, + "id": 59, + "panels": 
[], + "repeat": null, + "title": "TSDB stats", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 0, + "y": 47 + }, + "id": 36, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(increase(prometheus_tsdb_reloads_total{instance=\"$instance\",nc_region=~\"$region\"}[30m])) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ instance }}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Reloaded block from disk", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 6, + "y": 47 + }, + "id": 5, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, 
+ "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_tsdb_blocks_loaded{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Loaded data blocks", + "metric": "prometheus_local_storage_memory_chunkdescs", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Loaded data blocks", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 12, + "y": 47 + }, + "id": 3, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + 
"steppedLine": false, + "targets": [ + { + "expr": "prometheus_tsdb_head_series{instance=\"$instance\",nc_region=~\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Time series count", + "metric": "prometheus_local_storage_memory_series", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Time series total count", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 47 + }, + "id": 1, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum_over_time(prometheus_tsdb_head_samples_appended_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "samples/s {{instance}}", + "metric": "prometheus_local_storage_ingested_samples_total", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + 
"timeRegions": [], + "timeShift": null, + "title": "Samples Appended per second", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": "", + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 54 + }, + "id": 60, + "panels": [], + "repeat": null, + "title": "Head block stats", + "type": "row" + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833", + "To persist": "#9AC48A" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 55 + }, + "id": 2, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/Max.*/", + "fill": 0 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_tsdb_head_chunks{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)", + "format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "Head chunk count", + "metric": "prometheus_local_storage_memory_chunks", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": 
[], + "timeShift": null, + "title": "Head chunks count", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 55 + }, + "id": 35, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "max(prometheus_tsdb_head_max_time{instance=\"$instance\",nc_region=~\"$region\"}) by (instance) - min(prometheus_tsdb_head_min_time{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ instance }}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Length of head block", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "ms", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + 
"logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 55 + }, + "id": 4, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(prometheus_tsdb_head_chunks_created_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "created on {{ instance }}", + "refId": "B" + }, + { + "expr": "sum(rate(prometheus_tsdb_head_chunks_removed_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])) by (instance) * -1", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "deleted on {{ instance }}", + "refId": "C" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Head Chunks Created/Deleted per second", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + 
"max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 62 + }, + "id": 61, + "panels": [], + "repeat": null, + "title": "Data maintenance", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 0, + "y": 63 + }, + "id": 33, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum_over_time(prometheus_tsdb_compaction_duration_seconds_sum{instance=\"$instance\",nc_region=~\"$region\"}[30m]) / sum_over_time(prometheus_tsdb_compaction_duration_seconds_count{instance=\"$instance\",nc_region=~\"$region\"}[30m])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ instance }}", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Compaction duration", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": 
"${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 6, + "y": 63 + }, + "id": 34, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_tsdb_head_gc_duration_seconds_sum{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, quantile)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ quantile }} on {{ instance }}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Go Garbage collection duration", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 12, + "y": 63 + }, + "id": 37, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": 
false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_tsdb_wal_truncate_duration_seconds_sum{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, quantile)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ quantile }} on {{ instance }}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "WAL truncate duration seconds", + "tooltip": { + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 63 + }, + "id": 38, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(prometheus_tsdb_wal_fsync_duration_seconds{instance=\"$instance\",nc_region=~\"$region\"}) by (instance, quantile)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{ quantile }} {{ instance }}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "WAL fsync duration seconds", + "tooltip": { + "shared": true, + "sort": 2, + 
"value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "s", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 70 + }, + "id": 62, + "panels": [], + "repeat": null, + "title": "RAM&CPU", + "type": "row" + }, + { + "aliasColors": { + "Allocated bytes": "#7EB26D", + "Allocated bytes - 1m max": "#BF1B00", + "Allocated bytes - 1m min": "#BF1B00", + "Allocated bytes - 5m max": "#BF1B00", + "Allocated bytes - 5m min": "#BF1B00", + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833", + "RSS": "#447EBC" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": null, + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 71 + }, + "id": 6, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [ + { + "alias": "/-/", + "fill": 0 + }, + { + "alias": "collector heap size", + "color": "#E0752D", + "fill": 0, + "linewidth": 2 + }, + { + "alias": "collector kubernetes memory limit", + "color": "#BF1B00", + "fill": 0, + "linewidth": 3 + } + ], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(process_resident_memory_bytes{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)", + 
"format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "Total resident memory - {{instance}}", + "metric": "process_resident_memory_bytes", + "refId": "B", + "step": 1800 + }, + { + "expr": "sum(go_memstats_alloc_bytes{instance=\"$instance\",nc_region=~\"$region\"}) by (instance)", + "format": "time_series", + "hide": false, + "intervalFactor": 2, + "legendFormat": "Total llocated bytes - {{instance}}", + "metric": "go_memstats_alloc_bytes", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Memory", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": { + "Allocated bytes": "#F9BA8F", + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833", + "RSS": "#890F02" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 71 + }, + "id": 7, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": 
"rate(go_memstats_alloc_bytes_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "Allocated Bytes/s", + "metric": "go_memstats_alloc_bytes", + "refId": "A", + "step": 1800 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Allocations per second", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 2, + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 71 + }, + "id": 9, + "legend": { + "alignAsTable": false, + "avg": false, + "current": false, + "hideEmpty": false, + "max": false, + "min": false, + "rightSide": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(rate(process_cpu_seconds_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])) by (instance)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "CPU/s", + "metric": "prometheus_local_storage_ingested_samples_total", + "refId": "B", + "step": 1800 + } + ], + "thresholds": [], 
+ "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "CPU per second", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [ + "avg" + ] + }, + "yaxes": [ + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 78 + }, + "id": 63, + "panels": [], + "repeat": null, + "title": "Contrac errors", + "type": "row" + }, + { + "aliasColors": { + "Chunks": "#1F78C1", + "Chunks to persist": "#508642", + "Max chunks": "#052B51", + "Max to persist": "#3F6833" + }, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 1, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 79 + }, + "id": 47, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": false, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum(increase(net_conntrack_dialer_conn_failed_total{instance=\"$instance\",nc_region=~\"$region\"}[$aggregation_interval])) by (instance)", + "format": "time_series", + "hide": false, + "interval": "", + "intervalFactor": 2, + "legendFormat": "conntrack_dialer_conn_failed on {{ instance }}", + "metric": "prometheus_local_storage_chunk_ops_total", + "refId": "M", + "step": 1800 + } + ], + 
"thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Net errors", + "tooltip": { + "msResolution": false, + "shared": true, + "sort": 2, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "prometheus" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": ".+", + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(prometheus_build_info{nc_region=~\"$region\"}, instance)", + "hide": 0, + "includeAll": false, + "label": "Instance", + "multi": false, + "name": "instance", + "options": [], + "query": "label_values(prometheus_build_info{nc_region=~\"$region\"}, instance)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 2, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + 
"type": "query", + "useTags": false + }, + { + "auto": true, + "auto_count": 30, + "auto_min": "2m", + "current": { + "text": "30m", + "value": "30m" + }, + "hide": 0, + "label": "aggregation intarval", + "name": "aggregation_interval", + "options": [ + { + "selected": false, + "text": "auto", + "value": "$__auto_interval_aggregation_interval" + }, + { + "selected": false, + "text": "1m", + "value": "1m" + }, + { + "selected": false, + "text": "10m", + "value": "10m" + }, + { + "selected": true, + "text": "30m", + "value": "30m" + }, + { + "selected": false, + "text": "1h", + "value": "1h" + }, + { + "selected": false, + "text": "6h", + "value": "6h" + }, + { + "selected": false, + "text": "12h", + "value": "12h" + }, + { + "selected": false, + "text": "1d", + "value": "1d" + }, + { + "selected": false, + "text": "7d", + "value": "7d" + }, + { + "selected": false, + "text": "14d", + "value": "14d" + }, + { + "selected": false, + "text": "30d", + "value": "30d" + } + ], + "query": "1m,10m,30m,1h,6h,12h,1d,7d,14d,30d", + "refresh": 2, + "skipUrlSync": false, + "type": "interval" + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Prometheus2.12.0", + "uid": "prometheus", + "version": 7 + } + calico: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "1.0.0" + } + ], + "annotations": { 
+ "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Calico cluster monitoring dashboard", + "editable": false, + "overwrite": true, + "gnetId": 3244, + "graphTooltip": 0, + "id": 137, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "true": 0, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 15, + "panels": [], + "repeat": null, + "title": "Felix", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 1, + "w": 12, + "x": 0, + "y": 1 + }, + "id": 1, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_active_local_endpoints{nc_region=~\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active Local Endpoints", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { 
+ "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 1, + "w": 12, + "x": 12, + "y": 1 + }, + "id": 3, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_active_local_policies{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active Local Policies", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 8, + "w": 12, + "x": 0, + "y": 8 + }, + "id": 2, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + 
"percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_active_local_selectors{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active Local Selectors", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 8, + "w": 12, + "x": 12, + "y": 8 + }, + "id": 4, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_active_local_tags{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active Local Tags", + "tooltip": { + 
"shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 15, + "w": 12, + "x": 0, + "y": 15 + }, + "id": 5, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_cluster_num_host_endpoints{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cluster Host Endpoints", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, 
+ "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 15, + "w": 12, + "x": 12, + "y": 15 + }, + "id": 6, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_cluster_num_workload_endpoints{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Cluster Workload Endpoints", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 22, + "w": 12, + "x": 0, + "y": 22 + }, + "id": 7, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", 
+ "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_cluster_num_hosts{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Clusters Hosts", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 22, + "w": 12, + "x": 12, + "y": 22 + }, + "id": 8, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_ipsets_calico{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active IP Sets", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + 
"buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 29, + "w": 12, + "x": 0, + "y": 29 + }, + "id": 9, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_iptables_chains{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Active IP Tables Chains", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + 
"h": 7, + "true": 29, + "w": 12, + "x": 12, + "y": 29 + }, + "id": 10, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_ipset_errors{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "IP Set Command Failures", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 36, + "w": 12, + "x": 0, + "y": 36 + }, + "id": 11, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": 
"felix_iptables_save_errors{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "IP Tables Save Errors", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 36, + "w": 12, + "x": 12, + "y": 36 + }, + "id": 12, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_iptables_restore_errors{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "IP Tables Restore Errors", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + 
"yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 43, + "w": 12, + "x": 0, + "y": 43 + }, + "id": 13, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_resyncs_started{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Felix Resyncing Datastore", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 43, + "w": 12, + "x": 12, + "y": 43 + }, + "id": 14, + "legend": { + 
"alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_int_dataplane_failures{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Dataplane failed updates", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 43, + "w": 12, + "x": 0, + "y": 50 + }, + "id": 16, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_int_dataplane_addr_msg_batch_size{nc_region=\"$region\"}", + "format": 
"time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Felix int dataplane addr msg batch size", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 43, + "w": 12, + "x": 12, + "y": 50 + }, + "id": 17, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": true, + "min": true, + "show": true, + "total": true, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "felix_int_dataplane_iface_msg_batch_size{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Felix int dataplane iface msg batch size", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": 
"short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "true": 43, + "w": 12, + "x": 0, + "y": 57 + }, + "id": 18, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "go_memstats_frees_total{nc_region=\"$region\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{nc_region}} - {{instance}}", + "refId": "A", + "step": 20 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "go memstats frees total", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [ + "calico" + ], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus 
datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Kubernetes Calico", + "uid": "kubernetes-calico", + "version": 1 + } + openvswitch: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "6.2.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "5.0.0" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "5.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 82, + "links": [], + "panels": [ + { + "collapsed": false, + 
"gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 6, + "panels": [], + "title": "SRIOV", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 10, + "x": 0, + "y": 1 + }, + "id": 12, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(sriov_rx_bytes{node_name=~\"$node\", nc_region=~\"$region\"}[5m])", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{interface}} vfid:{{vfid}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "sriov_rx_bytes", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 10, + "x": 10, + "y": 1 + }, + "id": 13, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 2, + "links": 
[], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(sriov_tx_bytes{node_name=~\"$node\", nc_region=~\"$region\"}[5m])", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{interface}} vfid:{{vfid}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "sriov_tx_bytes", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 10, + "x": 0, + "y": 8 + }, + "id": 11, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(sriov_rx_dropped{node_name=~\"$node\", nc_region=~\"$region\"}[5m])", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{interface}} vfid:{{vfid}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + 
"title": "sriov_rx_dropped", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 10, + "x": 10, + "y": 8 + }, + "id": 21, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(sriov_tx_dropped{node_name=~\"$node\", nc_region=~\"$region\"}[5m])", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{interface}} vfid:{{vfid}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "sriov_tx_dropped", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { 
+ "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 10, + "x": 0, + "y": 15 + }, + "id": 7, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(sriov_tx_errors{node_name=~\"$node\", nc_region=~\"$region\"}[5m])", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{interface}} vfid:{{vfid}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "sriov_tx_errors", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 22 + }, + "id": 9, + "panels": [], + "title": "Openvswitch", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 10, + "x": 0, + "y": 23 + }, + "id": 15, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": 
true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(ovs_rx_bytes{node_name=~\"$node\", nc_region=~\"$region\"}[5m])", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{interface}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "ovs_rx_bytes", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 10, + "x": 10, + "y": 23 + }, + "id": 14, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(ovs_tx_bytes{node_name=~\"$node\", nc_region=~\"$region\"}[5m])", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{interface}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + 
"title": "ovs_tx_bytes", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 10, + "x": 0, + "y": 30 + }, + "id": 10, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(ovs_rx_errors{node_name=~\"$node\", nc_region=~\"$region\"}[5m])", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{interface}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "ovs_rx_errors", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + 
"bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 10, + "x": 10, + "y": 30 + }, + "id": 20, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rate(ovs_tx_errors{node_name=~\"$node\", nc_region=~\"$region\"}[5m])", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{interface}}", + "refId": "A" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "ovs_tx_errors", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus Source", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "Region", + 
"multi": false, + "name": "region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(node_uname_info{nc_region=\"$region\"}, hostname)", + "hide": 0, + "includeAll": true, + "label": "Node", + "multi": false, + "name": "node", + "options": [], + "query": "label_values(node_uname_info{nc_region=\"$region\"}, hostname)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Openvswitch Stats", + "uid": "openvswitch-stats", + "version": 1 + } + openstack-metrics: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "5.0.0" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "5.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + 
"editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 149, + "links": [], + "panels": [ + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#d44a3a", + "#299c46", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 3, + "x": 0, + "y": 0 + }, + "id": 12, + "interval": "> 60s", + "links": [ + { + "dashUri": "db/openstack_services_nova", + "dashboard": "Openstack_Services_Nova", + "includeVars": true, + "keepTime": false, + "name": "Drilldown dashboard", + "params": "var-Service=nova", + "title": "Openstack_Services_Nova", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_nova_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": 
"time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Nova_API_Check", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "API CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "API OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#d44a3a", + "#299c46", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 3, + "x": 3, + "y": 0 + }, + "id": 13, + "interval": "> 60s", + "links": [ + { + "dashUri": "db/openstack_services_neutron", + "dashboard": "Openstack_Services_Neutron", + "includeVars": true, + "name": "Drilldown dashboard", + "params": "var-Service=neutron", + "title": "Openstack_Services_Neutron", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_neutron_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": 
"last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Neutron_API_Check", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "API CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "API OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#d44a3a", + "#299c46", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 3, + "x": 6, + "y": 0 + }, + "id": 14, + "interval": "> 60s", + "links": [ + { + "dashUri": "db/openstack_services_cinder", + "dashboard": "Openstack_Services_Cinder", + "includeVars": true, + "name": "Drilldown dashboard", + "params": "var-Service=cinder", + "title": "Openstack_Services_Cinder", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + 
}, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_cinder_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Cinder_API_Check", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "API CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "API OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#d44a3a", + "#299c46", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 3, + "x": 9, + "y": 0 + }, + "id": 10, + "interval": "> 60s", + "links": [ + { + "dashUri": "db/openstack_services_glance", + "dashboard": "Openstack_Services_Glance", + "includeVars": true, + "name": "Drilldown dashboard", + "params": "var-Service=glance", + "title": "Openstack_Services_Glance", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + 
"postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_glance_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Glance_API_Check", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "API CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "API OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#d44a3a", + "#cca300", + "#299c46" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 3, + "x": 12, + "y": 0 + }, + "id": 15, + "interval": "> 60s", + "links": [ + { + "dashUri": "db/openstack_services_heat", + "dashboard": "Openstack_Services_Heat", + "includeVars": true, + "name": "Drilldown dashboard", + "params": "", + "title": "Openstack_Services_Heat", + "type": 
"dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum(openstack_check_heat_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_check_heat_cfn_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "2,2", + "title": "Heat_API_Check (Heat and Heat_CFN)", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "API CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "API OK", + "value": "2" + }, + { + "op": "=", + "text": "API CRITICAL", + "value": "1" + }, + { + "op": "=", + "text": "unknown", + "value": "3" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#d44a3a", + "#299c46", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": 
"${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 3, + "x": 15, + "y": 0 + }, + "id": 16, + "interval": "> 60s", + "links": [ + { + "dashUri": "db/openstack_services_keystone", + "dashboard": "Openstack_Services_Keystone", + "includeVars": true, + "params": "", + "targetBlank": false, + "title": "Openstack_Services_Keystone", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_keystone_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Keystone_API_Check", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "API CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "API 
OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#d44a3a", + "#299c46", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 3, + "x": 18, + "y": 0 + }, + "id": 17, + "interval": "> 60s", + "links": [ + { + "dashUri": "db/openstack_services_swift", + "dashboard": "Openstack_Services_Swift", + "includeVars": true, + "title": "Openstack_Services_Swift", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_swift_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": 
"Swift_API_Check", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "API CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "API OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#d44a3a", + "#299c46", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 3, + "x": 21, + "y": 0 + }, + "id": 18, + "interval": "> 60s", + "links": [ + { + "dashUri": "db/openstack_services_placement", + "dashboard": "Openstack_Services_Placement", + "includeVars": true, + "title": "Openstack_Services_Placement", + "type": "dashboard" + } + ], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_placement_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + 
} + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,2", + "title": "Placement_API_Check", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "API CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "API OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 3, + "x": 0, + "y": 5 + }, + "id": 2, + "interval": "> 60s", + "links": [ + { + "dashUri": "db/openstack_services_nova", + "dashboard": "Openstack_Services_Nova", + "includeVars": true, + "name": "Drilldown dashboard", + "params": "", + "title": "Openstack_Services_Nova", + "type": "dashboard" + } + ], + "mappingType": 2, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "0", + "text": "Services OK", + "to": "0" + }, + { + "from": "1", + "text": "Services CRITICAL", + "to": "100" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + 
"expr": "sum(openstack_services_nova_compute_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_nova_compute_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_nova_conductor_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_nova_conductor_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_nova_scheduler_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_nova_scheduler_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "instant": false, + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,1", + "title": "Nova", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "HEALTHY", + "value": "0" + }, + { + "op": "=", + "text": "UNHEALTHY", + "value": "1" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + 
"format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 3, + "x": 3, + "y": 5 + }, + "id": 3, + "interval": "> 60s", + "links": [ + { + "dashUri": "db/openstack_services_neutron", + "dashboard": "Openstack_Services_Neutron", + "includeVars": true, + "name": "Drilldown dashboard", + "params": "", + "title": "Openstack_Services_Neutron", + "type": "dashboard" + } + ], + "mappingType": 2, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "0", + "text": "Services OK", + "to": "0" + }, + { + "from": "1", + "text": "Services CRITICAL", + "to": "100" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum(openstack_services_neutron_l3_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_l3_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_dhcp_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_dhcp_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_metadata_agent_down_total{job=\"openstack-metrics\", 
openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_metadata_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_openvswitch_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_openvswitch_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_sriov_nic_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_neutron_sriov_nic_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,1", + "title": "Neutron", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "HEALTHY", + "value": "0" + }, + { + "op": "=", + "text": "UNHEALTHY", + "value": "1" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, 
+ "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 5, + "w": 3, + "x": 6, + "y": 5 + }, + "id": 11, + "interval": "> 60s", + "links": [ + { + "dashUri": "db/openstack_services_cinder", + "dashboard": "Openstack_Services_Cinder", + "includeVars": true, + "name": "Drilldown dashboard", + "params": "", + "title": "Openstack_Services_Cinder", + "type": "dashboard" + } + ], + "mappingType": 2, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "0", + "text": "Services OK", + "to": "0" + }, + { + "from": "1", + "text": "Services CRITICAL", + "to": "100" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum(openstack_services_cinder_volume_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_cinder_volume_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_cinder_backup_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_cinder_backup_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})+sum(openstack_services_cinder_scheduler_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", 
nc_region=\"$nc_region\"})+sum(openstack_services_cinder_scheduler_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "1,1", + "title": "Cinder", + "type": "singlestat", + "valueFontSize": "50%", + "valueMaps": [ + { + "op": "=", + "text": "no data", + "value": "null" + }, + { + "op": "=", + "text": "CRIT", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + }, + { + "op": "=", + "text": "UNKW", + "value": "2" + } + ], + "valueName": "current" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 10 + }, + "id": 5, + "panels": [], + "title": "Resource Utilization", + "type": "row" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 0, + "gridPos": { + "h": 9, + "w": 8, + "x": 0, + "y": 11 + }, + "id": 7, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": true, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "openstack_total_used_ram_MB{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "interval": "", + 
"intervalFactor": 1, + "legendFormat": "Used", + "refId": "A" + }, + { + "expr": "openstack_total_free_ram_MB{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "Free", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "os_vm_ram_usage", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decmbytes", + "label": "Memory Usage", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 0, + "gridPos": { + "h": 9, + "w": 8, + "x": 8, + "y": 11 + }, + "id": 8, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": true, + "min": true, + "show": true, + "total": true, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "openstack_total_used_vcpus{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 1, + "legendFormat": "Used", + "refId": "A" + }, + { + "expr": "openstack_total_free_vcpus{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", 
namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "Free", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "os_vm_vcpu_usage", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "percent", + "label": "VCPU Usage", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 0, + "gridPos": { + "h": 9, + "w": 8, + "x": 16, + "y": 11 + }, + "id": 9, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": " openstack_total_used_disk_GB{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "interval": "", + "intervalFactor": 1, + "legendFormat": "Used", + "refId": "A" + }, + { + "expr": "openstack_total_free_disk_GB{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "Free", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": 
null, + "timeRegions": [], + "timeShift": null, + "title": "os_vm_disk_usage", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "GBs", + "label": "disk Usage", + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "nc_region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "hide": 0, + "includeAll": false, + "label": "Openstack Region", + "multi": false, + "name": "openstack_region", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + 
"tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Openstack_Metrics_Overall", + "uid": "openstack-metrics-overall", + "version": 3 + } + openstack-nova: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "5.0.0" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "5.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 76, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 42, + 
"panels": [], + "title": "Nova API", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(225, 177, 40, 0.59)", + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 40, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_nova_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "0,1", + "title": "Nova_API_Service", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + } + ], + "valueName": 
"current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 4, + "y": 1 + }, + "id": 43, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum(nginx_responses_total{server_zone=~\"nova.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "count", + "groupBy": [ + { + "interval": "auto", + "params": [ + "auto" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120, + "tags": [] + } + ], + "thresholds": "", + "title": "HTTP 5xx errors", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + 
"dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 13, + "x": 8, + "y": 1 + }, + "id": 44, + "interval": "> 60s", + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "alias": "healthy", + "column": "value", + "expr": "openstack_check_nova_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "select": [], + "step": 120, + "tags": [] + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "API Availability", + "tooltip": { + "msResolution": false, + "shared": false, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "", + "logBase": 1, + "max": 1, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 8 + }, + "id": 7, + "panels": [], + "repeat": "openstack_region", + "title": 
"Nova", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 0, + "y": 9 + }, + "id": 9, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "maxPerRow": 1, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "repeat": "type", + "repeatDirection": "v", + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_nova_compute_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "hide": false, + "intervalFactor": 4, + "legendFormat": "", + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Nova-compute-down", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 2, + "y": 9 
+ }, + "id": 11, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_nova_compute_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Nova-compute-disabled", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 4, + "y": 9 + }, + "id": 20, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 
0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_nova_conductor_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Nova-conductor-disabled", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 6, + "y": 9 + }, + "id": 23, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_nova_conductor_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Nova-conductor-down", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + 
"op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 8, + "y": 9 + }, + "id": 19, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_nova_scheduler_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Nova-scheduler-down", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 10, + "y": 9 + }, + "id": 24, + "interval": null, + 
"links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_nova_scheduler_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Nova-scheduler-disabled", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 0, + "gridPos": { + "h": 9, + "w": 24, + "x": 0, + "y": 16 + }, + "hideTimeOverride": false, + "id": 15, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 1, + "points": false, + "renderer": "flot", + "repeat": null, + "repeatDirection": "h", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "openstack_services_nova_nova_consoleauth{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", 
nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A" + }, + { + "expr": "openstack_services_nova_nova_compute{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "B" + }, + { + "expr": "openstack_services_nova_nova_conductor{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "C" + }, + { + "expr": "openstack_services_nova_nova_scheduler{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "D" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Openstack_service_nova", + "tooltip": { + "shared": true, + "sort": 1, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": null, + "format": "short", + "label": null, + "logBase": 1, + "max": "1", + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + 
"definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "nc_region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "hide": 0, + "includeAll": false, + "label": "Openstack openstack_region", + "multi": false, + "name": "openstack_region", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Openstack_Services_Nova", + "uid": "openstack-services-nova", + "version": 2 + } + openstack-neutron: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", 
+ "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "5.0.0" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "5.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 188, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 42, + "panels": [], + "title": "Neutron API", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(225, 177, 40, 0.59)", + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 40, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + 
"lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_neutron_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "0,1", + "title": "Neutron_API_Service", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 4, + "y": 1 + }, + "id": 43, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + 
"show": true + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum(nginx_responses_total{server_zone=~\"neutron.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "count", + "groupBy": [ + { + "interval": "auto", + "params": [ + "auto" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120, + "tags": [] + } + ], + "thresholds": "", + "title": "HTTP 5xx errors", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 13, + "x": 8, + "y": 1 + }, + "id": 44, + "interval": "> 60s", + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "alias": "healthy", + "column": "value", + "expr": "openstack_check_neutron_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], 
+ "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "select": [], + "step": 120, + "tags": [] + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "API Availability", + "tooltip": { + "msResolution": false, + "shared": false, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "", + "logBase": 1, + "max": 1, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 8 + }, + "id": 13, + "panels": [], + "repeat": "agent", + "title": "Neutron", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 0, + "y": 9 + }, + "id": 28, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + 
"expr": "openstack_services_neutron_l3_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "neutron_l3_agent_down", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 2, + "y": 9 + }, + "id": 26, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_neutron_l3_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "neutron_l3_agent_disabled", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, +
"colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 4, + "y": 9 + }, + "id": 29, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_neutron_dhcp_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "neutron_dhcp_agent_down", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 6, + "y": 9 + }, + "id": 27, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + 
"name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_neutron_dhcp_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "neutron_dhcp_agent_disabled", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 8, + "y": 9 + }, + "id": 30, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": 
"openstack_services_neutron_metadata_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "neutron_metadata_agent_down", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 10, + "y": 9 + }, + "id": 31, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_neutron_metadata_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$nc_region\", namespace=\"$namespace\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "neutron_metadata_agent_disabled", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": 
true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 12, + "y": 9 + }, + "id": 33, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_neutron_openvswitch_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "neutron_openvswitch_agent_down", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 14, + "y": 9 + }, + "id": 32, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + 
"name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_neutron_openvswitch_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$nc_region\", namespace=\"$namespace\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "neutron_openvswitch_agent_disabled", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 16, + "y": 9 + }, + "id": 45, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": 
"openstack_services_neutron_sriov_nic_agent_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "neutron_sriov_nic_agent_down", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 18, + "y": 9 + }, + "id": 46, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_neutron_sriov_nic_agent_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "neutron_sriov_nic_agent_disabled", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + 
"aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 0, + "gridPos": { + "h": 9, + "w": 24, + "x": 0, + "y": 16 + }, + "hideTimeOverride": false, + "id": 15, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 1, + "points": false, + "renderer": "flot", + "repeat": null, + "repeatDirection": "h", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "openstack_services_neutron_neutron_l3_agent{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A" + }, + { + "expr": "openstack_services_neutron_neutron_metadata_agent{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "B" + }, + { + "expr": "openstack_services_neutron_neutron_dhcp_agent{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "C" + }, + { + "expr": "openstack_services_neutron_neutron_openvswitch_agent{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "D" + }, + { + "expr": "openstack_services_neutron_neutron_sriov_nic_agent{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", 
nc_region=~\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "E" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Neutron_Agents", + "tooltip": { + "shared": true, + "sort": 1, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": null, + "format": "short", + "label": null, + "logBase": 1, + "max": "1", + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "nc_region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "hide": 0, + "includeAll": false, + "label": "Openstack openstack_region", + "multi": false, + "name": "openstack_region", + "options": [], + "query": 
"label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Openstack_Services_Neutron", + "uid": "openstack-services-neutron", + "version": 2 + } + openstack-cinder: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "5.0.0" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "5.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + 
"editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 152, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 42, + "panels": [], + "title": "Cinder API", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(225, 177, 40, 0.59)", + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 40, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_cinder_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "0,1", + 
"title": "Cinder_API_Service", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 4, + "y": 1 + }, + "id": 43, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum(nginx_responses_total{server_zone=~\"cinder.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "count", + "groupBy": [ + { + "interval": "auto", + "params": [ + "auto" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120, + "tags": [] + } + ], + "thresholds": "", + "title": "HTTP 5xx 
errors", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 13, + "x": 8, + "y": 1 + }, + "id": 44, + "interval": "> 60s", + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "alias": "healthy", + "column": "value", + "expr": "openstack_check_cinder_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "select": [], + "step": 120, + "tags": [] + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "API Availability", + "tooltip": { + "msResolution": false, + "shared": false, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "", + "logBase": 1, + "max": 1, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": 
false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 8 + }, + "id": 7, + "panels": [], + "repeat": "openstack_region", + "title": "Cinder", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 0, + "y": 9 + }, + "id": 9, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "maxPerRow": 1, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "repeat": "type", + "repeatDirection": "v", + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_cinder_volume_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "hide": false, + "intervalFactor": 4, + "legendFormat": "", + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Cinder-volume-down", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + 
"datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 2, + "y": 9 + }, + "id": 23, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_cinder_volume_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Cinder-volume-disabled", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 4, + "y": 9 + }, + "id": 20, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + 
"options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_cinder_backup_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Cinder-backup-down", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 6, + "y": 9 + }, + "id": 22, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_cinder_backup_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", 
nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Cinder-backup-disabled", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 8, + "y": 9 + }, + "id": 11, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_cinder_scheduler_down_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Cinder-scheduler-down", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "#299c46", + "rgba(237, 129, 40, 0.89)", + "#d44a3a" + ], + "datasource": "${DS_PROMETHEUS}", + 
"format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 2, + "x": 10, + "y": 9 + }, + "id": 21, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "openstack_services_cinder_scheduler_disabled_total{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "A" + } + ], + "thresholds": "1,1", + "title": "Cinder-scheduler-disabled", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 0, + "gridPos": { + "h": 9, + "w": 24, + "x": 0, + "y": 16 + }, + "hideTimeOverride": false, + "id": 15, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "sort": "current", + "sortDesc": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 1, + "points": false, + "renderer": "flot", + "repeat": null, + "repeatDirection": "h", + 
"seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "expr": "openstack_services_cinderv3_cinder_volume{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "", + "refId": "A" + }, + { + "expr": "openstack_services_cinderv3_cinder_scheduler{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "B" + }, + { + "expr": "openstack_services_cinderv3_cinder_backup{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "intervalFactor": 1, + "refId": "C" + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Openstack_service_cinder", + "tooltip": { + "shared": true, + "sort": 1, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "decimals": null, + "format": "short", + "label": null, + "logBase": 1, + "max": "1", + "min": "0", + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": false, + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": 
"$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "nc_region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "hide": 0, + "includeAll": false, + "label": "Openstack openstack_region", + "multi": false, + "name": "openstack_region", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Openstack_Services_Cinder", + "uid": "openstack-services-cinder", + "version": 2 + } + openstack-glance: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": 
"prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "5.0.0" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "5.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 155, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 42, + "panels": [], + "title": "Glance API", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(225, 177, 40, 0.59)", + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 40, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 
0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_glance_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "0,1", + "title": "Glance_API_Service", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 4, + "y": 1 + }, + "id": 43, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": 
"rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum(nginx_responses_total{server_zone=~\"glance.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "count", + "groupBy": [ + { + "interval": "auto", + "params": [ + "auto" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120, + "tags": [] + } + ], + "thresholds": "", + "title": "HTTP 5xx errors", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 13, + "x": 8, + "y": 1 + }, + "id": 44, + "interval": "> 60s", + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "alias": "healthy", + "column": "value", + "expr": "openstack_check_glance_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + 
"type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "select": [], + "step": 120, + "tags": [] + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "API Availability", + "tooltip": { + "msResolution": false, + "shared": false, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "", + "logBase": 1, + "max": 1, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "nc_region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "hide": 0, + "includeAll": false, + "label": "Openstack openstack_region", + "multi": false, + "name": 
"openstack_region", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Openstack_Services_Glance", + "uid": "openstack-services-glance", + "version": 2 + } + openstack-heat: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "5.0.0" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "5.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & 
Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 158, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 42, + "panels": [], + "title": "Heat API", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(225, 177, 40, 0.59)", + "rgba(200, 54, 35, 0.88)", + "#299c46" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 40, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_heat_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + 
"thresholds": "0,1", + "title": "Heat_API_Service", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 4, + "y": 1 + }, + "id": 43, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum(nginx_responses_total{server_zone=~\"heat.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "count", + "groupBy": [ + { + "interval": "auto", + "params": [ + "auto" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120, + "tags": [] + } + ], + "thresholds": "", + 
"title": "HTTP 5xx errors", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 13, + "x": 8, + "y": 1 + }, + "id": 44, + "interval": "> 60s", + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "alias": "healthy", + "column": "value", + "expr": "openstack_check_heat_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "select": [], + "step": 120, + "tags": [] + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "API Availability", + "tooltip": { + "msResolution": false, + "shared": false, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "", + "logBase": 1, + "max": 1, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": 
null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 8 + }, + "id": 46, + "panels": [], + "title": "Heat CFN API", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(225, 177, 40, 0.59)", + "rgba(200, 54, 35, 0.88)", + "#299c46" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 0, + "y": 9 + }, + "id": 48, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_heat_cfn_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "0,1", + "title": "Heat_CFN_API_Service", + "type": 
"singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 4, + "y": 9 + }, + "id": 47, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum(nginx_responses_total{server_zone=~\"heat_cfn.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "count", + "groupBy": [ + { + "interval": "auto", + "params": [ + "auto" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120, + "tags": [] + } + ], + "thresholds": "", + "title": "HTTP 5xx errors", + "type": "singlestat", + 
"valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 13, + "x": 8, + "y": 9 + }, + "id": 49, + "interval": "> 60s", + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "alias": "healthy", + "column": "value", + "expr": "openstack_check_heat_cfn_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=\"$nc_region\"}", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "select": [], + "step": 120, + "tags": [] + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "API Availability", + "tooltip": { + "msResolution": false, + "shared": false, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "", + "logBase": 1, + "max": 1, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + 
"align": false, + "alignLevel": null + } + } + ], + "refresh": "5m", + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "nc_region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "hide": 0, + "includeAll": false, + "label": "Openstack openstack_region", + "multi": false, + "name": "openstack_region", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + 
"useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Openstack_Services_Heat", + "uid": "openstack-services-heat", + "version": 2 + } + openstack-keystone: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "5.0.0" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "5.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 185, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 42, + "panels": [], + "title": "Keystone API", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(225, 177, 40, 0.59)", + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 0, + 
"y": 1 + }, + "id": 40, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_keystone_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\",nc_region=~\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "instant": false, + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "0,1", + "title": "Keystone_API_Service", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 4, + "y": 1 + }, + "id": 
43, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum(nginx_responses_total{server_zone=~\"keystone.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\",nc_region=~\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "count", + "groupBy": [ + { + "interval": "auto", + "params": [ + "auto" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120, + "tags": [] + } + ], + "thresholds": "", + "title": "HTTP 5xx errors", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 13, + "x": 8, + "y": 1 + }, + "id": 44, + "interval": "> 60s", + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "connected", + "options": {}, + 
"percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "alias": "healthy", + "column": "value", + "expr": "openstack_check_keystone_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\",nc_region=~\"$nc_region\"}", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "select": [], + "step": 120, + "tags": [] + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "API Availability", + "tooltip": { + "msResolution": false, + "shared": false, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "", + "logBase": 1, + "max": 1, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": false, + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": 
"nc_region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "hide": 0, + "includeAll": false, + "label": "Openstack openstack_region", + "multi": false, + "name": "openstack_region", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Openstack_Services_Keystone", + "uid": "openstack-service-keystone", + "version": 2 + } + openstack-placement: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + 
"type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "5.0.0" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "5.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 77, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 42, + "panels": [], + "title": "Placement API", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(225, 177, 40, 0.59)", + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 40, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + 
"condition": "", + "expr": "openstack_check_placement_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "instant": false, + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "0,1", + "title": "Placement_API_Service", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 4, + "y": 1 + }, + "id": 43, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", 
+ "expr": "sum(nginx_responses_total{server_zone=~\"placement.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "count", + "groupBy": [ + { + "interval": "auto", + "params": [ + "auto" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "step": 120, + "tags": [] + } + ], + "thresholds": "", + "title": "HTTP 5xx errors", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 13, + "x": 8, + "y": 1 + }, + "id": 44, + "interval": "> 60s", + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "alias": "healthy", + "column": "value", + "expr": "openstack_check_placement_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + 
"refId": "A", + "resultFormat": "time_series", + "select": [], + "step": 120, + "tags": [] + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "API Availability", + "tooltip": { + "msResolution": false, + "shared": false, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "", + "logBase": 1, + "max": 1, + "min": 0, + "show": true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": false, + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "nc_region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "hide": 0, + "includeAll": false, + "label": "Openstack openstack_region", + "multi": false, + "name": "openstack_region", + "options": [], + "query": 
"label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": { + "tags": [], + "text": "openstack", + "value": "openstack" + }, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Openstack_Services_Placement", + "uid": "openstack_services_placement", + "version": 1 + } + openstack-swift: |- + { + "__inputs": [ + { + "name": "DS_PROMETHEUS", + "label": "prometheus", + "description": "", + "type": "datasource", + "pluginId": "prometheus", + "pluginName": "Prometheus" + } + ], + "__requires": [ + { + "type": "grafana", + "id": "grafana", + "name": "Grafana", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "graph", + "name": "Graph", + "version": "5.0.0" + }, + { + "type": "datasource", + "id": "prometheus", + "name": "Prometheus", + "version": "5.0.0" + }, + { + "type": "panel", + "id": "singlestat", + "name": "Singlestat", + "version": "5.0.0" + } + ], + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + 
"name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 203, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 42, + "panels": [], + "title": "Swift API", + "type": "row" + }, + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(225, 177, 40, 0.59)", + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 40, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "openstack_check_swift_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "fill": "", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "null" + ], + "type": "fill" + } + ], + "groupByTags": [], + "groupby_field": "", + "instant": false, + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", 
+ "resultFormat": "time_series", + "step": 120 + } + ], + "thresholds": "0,1", + "title": "Swift_API_Service", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "CRITICAL", + "value": "0" + }, + { + "op": "=", + "text": "OK", + "value": "1" + } + ], + "valueName": "current" + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(200, 54, 35, 0.88)", + "rgba(118, 245, 40, 0.73)", + "rgba(225, 177, 40, 0.59)" + ], + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 4, + "y": 1 + }, + "id": 43, + "interval": "> 60s", + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": true + }, + "tableColumn": "", + "targets": [ + { + "column": "value", + "condition": "", + "expr": "sum(nginx_responses_total{server_zone=~\"swift.*\", status_code=\"5xx\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"})", + "fill": "", + "format": "time_series", + "function": "count", + "groupBy": [ + { + "interval": "auto", + "params": [ + "auto" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupby_field": "", + "interval": "", + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": 
"time_series", + "step": 120, + "tags": [] + } + ], + "thresholds": "", + "title": "HTTP 5xx errors", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "0", + "value": "null" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "editable": true, + "error": false, + "fill": 0, + "grid": {}, + "gridPos": { + "h": 7, + "w": 13, + "x": 8, + "y": 1 + }, + "id": 44, + "interval": "> 60s", + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 3, + "links": [], + "nullPointMode": "connected", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": true, + "targets": [ + { + "alias": "healthy", + "column": "value", + "expr": "openstack_check_swift_api{job=\"openstack-metrics\", openstack_region=\"$openstack_region\", namespace=\"$namespace\", nc_region=~\"$nc_region\"}", + "format": "time_series", + "function": "last", + "groupBy": [ + { + "params": [ + "$interval" + ], + "type": "time" + }, + { + "params": [ + "0" + ], + "type": "fill" + } + ], + "groupByTags": [], + "intervalFactor": 2, + "policy": "default", + "rawQuery": false, + "refId": "A", + "resultFormat": "time_series", + "select": [], + "step": 120, + "tags": [] + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "API Availability", + "tooltip": { + "msResolution": false, + "shared": false, + "sort": 0, + "value_type": "cumulative" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": "", + "logBase": 1, + "max": 1, + "min": 0, + "show": 
true + }, + { + "format": "short", + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": false, + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "nc_region", + "options": [], + "query": "label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "hide": 0, + "includeAll": false, + "label": "Openstack openstack_region", + "multi": false, + "name": "openstack_region", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds{nc_region=\"$nc_region\"}, openstack_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "${DS_PROMETHEUS}", + "definition": "", + "hide": 0, + "includeAll": false, + "label": "namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(openstack_exporter_cache_refresh_duration_seconds, namespace)", + "refresh": 1, + "regex": 
"", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "Openstack_Services_Swift", + "uid": "openstack-services-swift", + "version": 2 + } + rabbitmq_stats: |- + { + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": "-- Grafana --", + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "Basic rabbitmq host stats: Node Stats, Exchanges, Channels, Consumers, Connections, Queues, Messages, Messages per Queue, Memory, File Descriptors, Sockets.", + "editable": false, + "overwrite": true, + "gnetId": null, + "graphTooltip": 0, + "id": 87, + "links": [], + "panels": [ + { + "cacheTimeout": null, + "colorBackground": true, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "${DS_PROMETHEUS}", + "format": "none", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": false, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": { + "h": 7, + "w": 6, + "x": 0, + "y": 0 + }, + "id": 13, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "options": {}, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "30%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "sparkline": { + 
"fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "count (rabbitmq_up{nc_region=~\"$region\"} == 1)", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "metric": "rabbitmq_up", + "refId": "A", + "step": 2 + } + ], + "thresholds": "Up,Down", + "timeFrom": "30s", + "title": "RabbitMQ Server", + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + }, + { + "op": "=", + "text": "Down", + "value": "0" + }, + { + "op": ">=", + "text": "Up", + "value": "1" + } + ], + "valueName": "current" + }, + { + "aliasColors": {}, + "bars": true, + "dashLength": 10, + "dashes": false, + "datasource": "prometheus", + "decimals": 0, + "fill": 1, + "gridPos": { + "h": 7, + "w": 18, + "x": 6, + "y": 0 + }, + "id": 12, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "show": true, + "total": false, + "values": true + }, + "lines": false, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_running{nc_region=~\"$region\",node=~\"$rabbitmq_node\"}", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "{{pod}}", + "metric": "rabbitmq_running", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": "30s", + "timeRegions": [], + "timeShift": null, + "title": "Node up Stats", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + 
"show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 7 + }, + "id": 6, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_exchanges{nc_region=~\"$region\",kubernetes_namespace=~\"$namespace\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{release_group}}:exchanges", + "metric": "rabbitmq_exchangesTotal", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Number of Exchanges", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 7 + }, + "id": 4, + "legend": { + "alignAsTable": true, + "avg": true, 
+ "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_channels{nc_region=~\"$region\",kubernetes_namespace=~\"$namespace\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{release_group}}:channels", + "metric": "rabbitmq_channelsTotal", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Number of Channels", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 7 + }, + "id": 3, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": 
"rabbitmq_consumers{nc_region=~\"$region\",kubernetes_namespace=~\"$namespace\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{release_group}}:consumers", + "metric": "rabbitmq_consumersTotal", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Number of Consumers", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 14 + }, + "id": 5, + "legend": { + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_connections{nc_region=~\"$region\",kubernetes_namespace=~\"$namespace\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{release_group}}:connections", + "metric": "rabbitmq_connectionsTotal", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Number of Connections", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + 
"xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 14 + }, + "id": 7, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_queues{nc_region=~\"$region\",kubernetes_namespace=~\"$namespace\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{release_group}}:queues", + "metric": "rabbitmq_queuesTotal", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Number of Queues", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + 
"datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 21 + }, + "id": 8, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "sum by (vhost)(rabbitmq_queue_messages_ready{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{vhost}}:ready", + "metric": "rabbitmq_queue_messages_ready", + "refId": "A", + "step": 2 + }, + { + "expr": "sum by (vhost)(rabbitmq_queue_messages_published_total{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{vhost}}:published", + "metric": "rabbitmq_queue_messages_published_total", + "refId": "B", + "step": 2 + }, + { + "expr": "sum by (vhost)(rabbitmq_queue_messages_delivered_total{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{vhost}}:delivered", + "metric": "rabbitmq_queue_messages_delivered_total", + "refId": "C", + "step": 2 + }, + { + "expr": "sum by (vhost)(rabbitmq_queue_messages_unacknowledged{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\"})", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{vhost}}:unack", + "metric": "ack", + "refId": "D", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Messages/host", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + 
"buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "decimals": 0, + "fill": 1, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 21 + }, + "id": 2, + "legend": { + "alignAsTable": true, + "avg": false, + "current": true, + "max": false, + "min": false, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_queue_messages{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{queue}}:{{durable}}", + "metric": "rabbitmq_queue_messages", + "refId": "A", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Messages / Queue", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + 
"dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 28 + }, + "id": 9, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_node_mem_used{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\", node=~\"$rabbitmq_node\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{pod}}:used", + "metric": "rabbitmq_node_mem_used", + "refId": "A", + "step": 2 + }, + { + "expr": "rabbitmq_node_mem_limit{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\", node=~\"$rabbitmq_node\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{pod}}:limit", + "metric": "node_mem", + "refId": "B", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Memory", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "decbytes", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 28 + }, + "id": 10, + "legend": { + "alignAsTable": true, + 
"avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_fd_used{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\", node=~\"$rabbitmq_node\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{pod}}:used", + "metric": "", + "refId": "A", + "step": 2 + }, + { + "expr": "rabbitmq_fd_total{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\", node=~\"$rabbitmq_node\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{pod}}:total", + "metric": "node_mem", + "refId": "B", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "FIle descriptors", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "${DS_PROMETHEUS}", + "fill": 1, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 35 + }, + "id": 11, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "options": {}, + 
"percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "expr": "rabbitmq_sockets_used{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\", node=~\"$rabbitmq_node\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{pod}}:used", + "metric": "", + "refId": "A", + "step": 2 + }, + { + "expr": "rabbitmq_sockets_total{nc_region=~\"$region\", kubernetes_namespace=~\"$namespace\", node=~\"$rabbitmq_node\"}", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "{{pod}}:total", + "metric": "", + "refId": "B", + "step": 2 + } + ], + "thresholds": [], + "timeFrom": null, + "timeRegions": [], + "timeShift": null, + "title": "Sockets ", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": true + } + ], + "yaxis": { + "align": false, + "alignLevel": null + } + } + ], + "refresh": "1m", + "schemaVersion": 18, + "style": "dark", + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "prometheus", + "value": "prometheus" + }, + "hide": 0, + "includeAll": false, + "label": "Prometheus datasource", + "multi": false, + "name": "DS_PROMETHEUS", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "type": "datasource" + }, + { + "allValue": ".+", + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(nc_region)", + "hide": 0, + "includeAll": false, + "label": "NC Region", + "multi": false, + "name": "region", + "options": [], + "query": 
"label_values(nc_region)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(rabbitmq_up{nc_region=\"$region\"}, kubernetes_namespace)", + "hide": 0, + "includeAll": false, + "label": "Namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(rabbitmq_up{nc_region=\"$region\"}, kubernetes_namespace)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$DS_PROMETHEUS", + "definition": "label_values(rabbitmq_up{kubernetes_namespace=\"$namespace\"}, node)", + "hide": 0, + "includeAll": false, + "label": "Node", + "multi": false, + "name": "rabbitmq_node", + "options": [], + "query": "label_values(rabbitmq_up{kubernetes_namespace=\"$namespace\"}, node)", + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-1h", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "UTC", + "title": "RabbitMQ Stats", + "uid": "rabbitmq-stats", + "version": 4 + } dependencies: - grafana-htk ... 
diff --git a/global/software/charts/osh-infra/osh-infra-dashboards/kibana.yaml b/global/software/charts/osh-infra/osh-infra-dashboards/kibana.yaml index 5931ca706..f6866e09a 100644 --- a/global/software/charts/osh-infra/osh-infra-dashboards/kibana.yaml +++ b/global/software/charts/osh-infra/osh-infra-dashboards/kibana.yaml @@ -99,21 +99,23 @@ data: create_kibana_indexes: enabled: true indexes: - - airship - - audit_tsee - - auth - - calico - - ceph - - flows - - jenkins - - journal - - kernel_syslog - - libvirt - - logstash - - lma - - openstack - - utility_access - - openvswitch + base: + - airship + - audit_tsee + - auth + - calico + - ceph + - flows + - jenkins + - journal + - kernel_syslog + - libvirt + - logstash + - lma + - utility_access + application: + - openstack + - openvswitch default_index: logstash kibana: elasticsearch: diff --git a/global/software/charts/osh/openstack-compute-kit/chart-group.yaml b/global/software/charts/osh/openstack-compute-kit/chart-group.yaml index 6fd239081..6b76be83f 100644 --- a/global/software/charts/osh/openstack-compute-kit/chart-group.yaml +++ b/global/software/charts/osh/openstack-compute-kit/chart-group.yaml @@ -10,9 +10,10 @@ metadata: layer: global storagePolicy: cleartext data: - description: Deploy Nova, Neutron, Openvswitch, and Libvirt + description: Deploy Nova, Neutron, Openvswitch, Placement, and Libvirt chart_group: - libvirt - openvswitch - neutron + - placement - nova diff --git a/global/software/charts/osh/openstack-compute-kit/neutron.yaml b/global/software/charts/osh/openstack-compute-kit/neutron.yaml index bc20103ae..bcf575c6f 100644 --- a/global/software/charts/osh/openstack-compute-kit/neutron.yaml +++ b/global/software/charts/osh/openstack-compute-kit/neutron.yaml @@ -236,7 +236,7 @@ data: native: enabled: false test: - timeout: 720 + timeout: 1400 install: no_hooks: false upgrade: diff --git a/global/software/charts/osh/openstack-compute-kit/nova.yaml 
b/global/software/charts/osh/openstack-compute-kit/nova.yaml index 5cfa1a5cd..ff3acff48 100644 --- a/global/software/charts/osh/openstack-compute-kit/nova.yaml +++ b/global/software/charts/osh/openstack-compute-kit/nova.yaml @@ -325,6 +325,20 @@ data: post: create: [] values: + manifests: + # NOTE(lamt): disable consoleauth and placement from nova in Train release. + certificates: false + deployment_consoleauth: false + deployment_placement: false + ingress_placement: false + job_db_init_placement: false + job_ks_placement_endpoints: false + job_ks_placement_service: false + job_ks_placement_user: false + pdb_placement: false + secret_keystone_placement: false + service_ingress_placement: false + service_placement: false dependencies: static: rabbit_init: @@ -775,20 +789,14 @@ data: values: - RetryFilter - AvailabilityZoneFilter - - RamFilter - - CoreFilter - - DiskFilter - ComputeFilter - ImagePropertiesFilter - ServerGroupAntiAffinityFilter - ServerGroupAffinityFilter - AggregateInstanceExtraSpecsFilter - - AggregateCoreFilter - - AggregateRamFilter - AggregateMultiTenancyIsolation - JsonFilter - IoOpsFilter - - AggregateDiskFilter - AllHostsFilter - IsolatedHostsFilter - AggregateImagePropertiesIsolation @@ -816,6 +824,7 @@ data: key_pairs: 10 cinder: http_retries: 6 + catalog_info: "volumev3::internalURL" oslo_messaging_rabbit: heartbeat_timeout_threshold: 60 audit_middleware_notifications: diff --git a/global/software/charts/osh/openstack-compute-kit/placement.yaml b/global/software/charts/osh/openstack-compute-kit/placement.yaml new file mode 100644 index 000000000..f8c7f64ad --- /dev/null +++ b/global/software/charts/osh/openstack-compute-kit/placement.yaml @@ -0,0 +1,416 @@ +--- +schema: armada/Chart/v1 +metadata: + schema: metadata/Document/v1 + name: placement + labels: + name: placement-global + component: placement + layeringDefinition: + abstract: false + layer: global + storagePolicy: cleartext + substitutions: + # Chart source + - src: + schema: 
pegleg/SoftwareVersions/v1 + name: software-versions + path: .charts.osh.placement + dest: + path: .source + + # Images + - src: + schema: pegleg/SoftwareVersions/v1 + name: software-versions + path: .images.osh.placement + dest: + path: .values.images.tags + + # Endpoints + - src: + schema: pegleg/EndpointCatalogue/v1 + name: osh_endpoints + path: .osh.identity + dest: + path: .values.endpoints.identity + - src: + schema: pegleg/EndpointCatalogue/v1 + name: osh_endpoints + path: .osh.oslo_db + dest: + path: .values.endpoints.oslo_db + - src: + schema: pegleg/EndpointCatalogue/v1 + name: osh_endpoints + path: .osh.oslo_messaging + dest: + path: .values.endpoints.oslo_messaging + - src: + schema: pegleg/EndpointCatalogue/v1 + name: osh_endpoints + path: .osh.oslo_cache + dest: + path: .values.endpoints.oslo_cache + - src: + schema: pegleg/EndpointCatalogue/v1 + name: osh_endpoints + path: .osh.placement + dest: + path: .values.endpoints.placement + + # Service Accounts + - src: + schema: pegleg/AccountCatalogue/v1 + name: osh_service_accounts + path: .osh.keystone.admin + dest: + path: .values.endpoints.identity.auth.admin + - src: + schema: pegleg/AccountCatalogue/v1 + name: osh_service_accounts + path: .osh.placement.placement + dest: + path: .values.endpoints.identity.auth.placement + - src: + schema: pegleg/AccountCatalogue/v1 + name: osh_service_accounts + path: .osh.placement.test + dest: + path: .values.endpoints.identity.auth.test + - src: + schema: pegleg/AccountCatalogue/v1 + name: osh_service_accounts + path: .osh.oslo_messaging.admin + dest: + path: .values.endpoints.oslo_messaging.auth.admin + - src: + schema: pegleg/AccountCatalogue/v1 + name: osh_service_accounts + path: .osh.nova.oslo_messaging.placement + dest: + path: .values.endpoints.oslo_messaging.auth.placement + - src: + schema: pegleg/AccountCatalogue/v1 + name: osh_service_accounts + path: .osh.placement.oslo_db.username + dest: + path: .values.endpoints.oslo_db.auth.placement.username + - 
src: + schema: pegleg/AccountCatalogue/v1 + name: osh_service_accounts + path: .osh.placement.oslo_db.database + dest: + path: .values.endpoints.oslo_db.path + pattern: DB_NAME + + # Secrets + - dest: + path: .values.endpoints.identity.auth.admin.password + src: + schema: deckhand/Passphrase/v1 + name: osh_keystone_admin_password + path: . + - dest: + path: .values.endpoints.identity.auth.placement.password + src: + schema: deckhand/Passphrase/v1 + name: osh_placement_password + path: . + - dest: + path: .values.endpoints.identity.auth.test.password + src: + schema: deckhand/Passphrase/v1 + name: osh_nova_test_password + path: . + - dest: + path: .values.endpoints.identity.auth.neutron.password + src: + schema: deckhand/Passphrase/v1 + name: osh_neutron_password + path: . + - dest: + path: .values.endpoints.identity.auth.placement.password + src: + schema: deckhand/Passphrase/v1 + name: osh_placement_password + path: . + - dest: + path: .values.endpoints.identity.auth.ironic.password + src: + schema: deckhand/Passphrase/v1 + name: osh_ironic_password + path: . + - dest: + path: .values.endpoints.oslo_messaging.auth.admin.password + src: + schema: deckhand/Passphrase/v1 + name: osh_oslo_messaging_admin_password + path: . + - dest: + path: .values.endpoints.oslo_messaging.auth.placement.password + src: + schema: deckhand/Passphrase/v1 + name: osh_nova_oslo_messaging_password + path: . + - dest: + path: .values.endpoints.oslo_db.auth.placement.password + src: + schema: deckhand/Passphrase/v1 + name: osh_nova_oslo_db_password + path: . + - dest: + path: .values.endpoints.oslo_db.auth.admin.password + src: + schema: deckhand/Passphrase/v1 + name: osh_oslo_db_admin_password + path: . + - dest: + path: .values.endpoints.oslo_cache.auth.memcache_secret_key + src: + schema: deckhand/Passphrase/v1 + name: osh_oslo_cache_secret_key + path: . 
+ - dest: + path: .values.endpoints.oslo_db.auth.nova_api.password + src: + schema: deckhand/Passphrase/v1 + name: osh_nova_oslo_db_password + path: . + - dest: + path: .values.endpoints.oslo_db.auth.nova_api.username + src: + schema: pegleg/AccountCatalogue/v1 + name: osh_service_accounts + path: .osh.nova.oslo_db.username + + +data: + chart_name: placement + release: placement + namespace: openstack + wait: + timeout: 2700 + labels: + release_group: clcp-placement + resources: + - type: job + - type: deployment + min_ready: 100% + native: + enabled: false + test: + timeout: 600 + install: + no_hooks: false + upgrade: + no_hooks: false + pre: + delete: + - type: job + labels: + release_group: clcp-placement + post: + create: [] + values: + manifests: + certificates: false + job_db_migrate: false + dependencies: + static: + rabbit_init: + services: + - endpoint: internal + service: oslo_messaging + jobs: + - clcp-openstack-rabbitmq-cluster-wait + db_sync: + jobs: + - placement-db-init + labels: + job: + node_selector_key: openstack-control-plane + node_selector_value: enabled + api: + node_selector_key: openstack-control-plane + node_selector_value: enabled + test: + node_selector_key: openstack-control-plane + node_selector_value: enabled + pod: + mandatory_access_control: + type: apparmor + placement-api: + placement-api: runtime/default + init: runtime/default + placement-db-migrate: + init: runtime/default + placement-mysql-migration: runtime/default + replicas: + api: 4 + affinity: + anti: + type: + placement: requiredDuringSchedulingIgnoredDuringExecution + weight: + default: 100 + lifecycle: + upgrades: + deployments: + pod_replacement_strategy: RollingUpdate + rolling_update: + max_unavailable: 50% + security_context: + placement: + container: + placement_api: + allowPrivilegeEscalation: false + network: + api: + ingress: + annotations: + nginx.ingress.kubernetes.io/backend-protocol: "https" + nginx.ingress.kubernetes.io/configuration-snippet: | + 
more_set_headers "X-XSS-Protection: 1; mode=block"; + more_set_headers "X-Frame-Options: deny"; + if ($request_method !~ ^(HEAD|GET|POST|PUT|PATCH|DELETE)$ ) { + return 405; + } + conf: + logging: + loggers: + keys: + - root + - placement + - oslo.messaging + handlers: + keys: + - stdout + - stderr + - "null" + formatters: + keys: + - context + - default + logger_root: + level: WARNING + handlers: "null" + logger_placement: + level: INFO + handlers: + - stdout + qualname: placement + logger_oslo.messaging: + level: INFO + handlers: + - stdout + qualname: oslo.messaging + logger_amqp: + level: WARNING + handlers: stderr + qualname: amqp + logger_amqplib: + level: WARNING + handlers: stderr + qualname: amqplib + logger_eventletwsgi: + level: WARNING + handlers: stderr + qualname: eventlet.wsgi.server + logger_sqlalchemy: + level: WARNING + handlers: stderr + qualname: sqlalchemy + logger_boto: + level: WARNING + handlers: stderr + qualname: boto + handler_null: + class: logging.NullHandler + formatter: default + args: () + handler_stdout: + class: StreamHandler + args: (sys.stdout,) + formatter: context + handler_stderr: + class: StreamHandler + args: (sys.stderr,) + formatter: context + formatter_context: + class: oslo_log.formatters.ContextFormatter + formatter_default: + format: "%(message)s" + policy: + "context_is_admin": "role:admin" + "admin_or_owner": "rule:context_is_admin or project_id:%(project_id)s" + "default": "rule:admin_or_owner" + "admin_api": "role:admin" + "placement:resource_providers:list": "rule:admin_api" + "placement:resource_providers:create": "rule:admin_api" + "placement:resource_providers:show": "rule:admin_api" + "placement:resource_providers:update": "rule:admin_api" + "placement:resource_providers:delete": "rule:admin_api" + "placement:resource_classes:list": "rule:admin_api" + "placement:resource_classes:create": "rule:admin_api" + "placement:resource_classes:show": "rule:admin_api" + "placement:resource_classes:update": 
"rule:admin_api" + "placement:resource_classes:delete": "rule:admin_api" + "placement:resource_providers:inventories:list": "rule:admin_api" + "placement:resource_providers:inventories:create": "rule:admin_api" + "placement:resource_providers:inventories:show": "rule:admin_api" + "placement:resource_providers:inventories:update": "rule:admin_api" + "placement:resource_providers:inventories:delete": "rule:admin_api" + "placement:resource_providers:aggregates:list": "rule:admin_api" + "placement:resource_providers:aggregates:update": "rule:admin_api" + "placement:resource_providers:usages": "rule:admin_api" + "placement:usages": "rule:admin_api" + "placement:traits:list": "rule:admin_api" + "placement:traits:show": "rule:admin_api" + "placement:traits:update": "rule:admin_api" + "placement:traits:delete": "rule:admin_api" + "placement:resource_providers:traits:list": "rule:admin_api" + "placement:resource_providers:traits:update": "rule:admin_api" + "placement:resource_providers:traits:delete": "rule:admin_api" + "placement:allocations:manage": "rule:admin_api" + "placement:allocations:list": "rule:admin_api" + "placement:allocations:update": "rule:admin_api" + "placement:allocations:delete": "rule:admin_api" + "placement:resource_providers:allocations:list": "rule:admin_api" + "placement:allocation_candidates:list": "rule:admin_api" + "placement:reshaper:reshape": "rule:admin_api" + "not_implemented_in_aic": '!' + placement: + DEFAULT: + debug: false + dependencies: + - os-placement-htk +... 
+--- +schema: armada/Chart/v1 +metadata: + schema: metadata/Document/v1 + name: os-placement-htk + layeringDefinition: + abstract: false + layer: global + substitutions: + - src: + schema: pegleg/SoftwareVersions/v1 + name: software-versions + path: .charts.osh.placement-htk + dest: + path: .source + storagePolicy: cleartext +data: + chart_name: os-placement-htk + release: os-placement-htk + namespace: os-placement-htk + timeout: 600 + wait: + timeout: 600 + upgrade: + no_hooks: true + values: {} + dependencies: [] +... diff --git a/global/software/charts/ucp/ceph/ceph-client-update.yaml b/global/software/charts/ucp/ceph/ceph-client-update.yaml index c7f3e7da2..666e47699 100644 --- a/global/software/charts/ucp/ceph/ceph-client-update.yaml +++ b/global/software/charts/ucp/ceph/ceph-client-update.yaml @@ -123,13 +123,13 @@ data: enabled: true script: | set -x - DESIRED_VERSION="octopus" + DESIRED_VERSION="nautilus" ADDITIONAL_VERSIONS=1 while [ $ADDITIONAL_VERSIONS -gt 0 ]; do sleep 5 - ADDITIONAL_VERSIONS=$(ceph tell osd.* version --format json | awk -F 'osd.[0-9]*: ' '/^osd/ { print $2}' | jq -r '.release' | uniq | grep -v ${DESIRED_VERSION} | wc -l ) + ADDITIONAL_VERSIONS=$(ceph tell osd.* version --format json | awk -F 'osd.[0-9]*: ' '/^osd/ { print $2}' | jq -r '.version' | awk '{ print $(NF-1) }' | uniq | grep -v ${DESIRED_VERSION} | wc -l ) done - while [[ `ceph pg stat -f json | jq -r ".pg_summary.num_pgs"` -eq 0 ]] || [[ `ceph pg ls -f json | jq -r '.pg_stats[].state' | grep -v "active"` ]] + while [[ `ceph pg ls | tail -n +2 | grep -v "active+\|NOTE"` ]] do sleep 5 done @@ -239,9 +239,7 @@ data: features: # NOTE(st053q): If autoscaler is disabled, then # mon_pg_warn_max_object_skew should not be 0 in ceph.conf - pg_autoscaler: true - cluster_flags: - unset: "noup" + pg_autoscaler: false pool: spec: # Health metrics pool diff --git a/global/software/charts/ucp/ceph/ceph-client.yaml b/global/software/charts/ucp/ceph/ceph-client.yaml index a1823a9a7..2325cf630 
100644 --- a/global/software/charts/ucp/ceph/ceph-client.yaml +++ b/global/software/charts/ucp/ceph/ceph-client.yaml @@ -93,6 +93,7 @@ data: component: test test: enabled: true + timeout: 3600 values: labels: job: @@ -211,8 +212,6 @@ data: conf: features: pg_autoscaler: false - cluster_flags: - set: "noup" pool: spec: # Health metrics pool diff --git a/global/software/config/endpoints.yaml b/global/software/config/endpoints.yaml index 1a705bf6f..d78fcec10 100644 --- a/global/software/config/endpoints.yaml +++ b/global/software/config/endpoints.yaml @@ -256,6 +256,10 @@ data: podport: 10283 status: podport: 18089 + stream: + podport: 18090 + profiler: + podport: 18088 kubernetesprovisioner: name: promenade hosts: diff --git a/global/software/config/versions.yaml b/global/software/config/versions.yaml index 8aad81e42..eb1bcd084 100644 --- a/global/software/config/versions.yaml +++ b/global/software/config/versions.yaml @@ -201,7 +201,7 @@ data: type: git cinder-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 3dd0eb0cdf54387447f07a4ec6be9582c457a1a8 + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git glance: @@ -211,7 +211,7 @@ data: type: git glance-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 3dd0eb0cdf54387447f07a4ec6be9582c457a1a8 + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git heat: @@ -221,7 +221,7 @@ data: type: git heat-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 3dd0eb0cdf54387447f07a4ec6be9582c457a1a8 + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git helm_toolkit: @@ -236,7 +236,7 @@ data: type: git horizon-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 3dd0eb0cdf54387447f07a4ec6be9582c457a1a8 + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git ingress: @@ -251,7 +251,7 @@ data: type: git 
keystone: location: https://opendev.org/openstack/openstack-helm - reference: 28d0a56e46129276559a4ddb2dea32c35b10b58e + reference: d467d685a3863edc5fed7c352961b3235a5e3a99 subpath: keystone type: git keystone-htk: @@ -266,7 +266,7 @@ data: type: git libvirt-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 3dd0eb0cdf54387447f07a4ec6be9582c457a1a8 + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git mariadb: @@ -276,7 +276,7 @@ data: type: git mariadb-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: b482b57e6ea85eceef02787cb2e8eb884cceb80c + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git memcached: @@ -296,17 +296,17 @@ data: type: git neutron-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 4f30b1361e2b596ce8760fd593f08d4f9a6639fe + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git nova: location: https://opendev.org/openstack/openstack-helm - reference: 4aa7a3026706758d22dc3e7002a2a0bffcfd84ea + reference: 2ec17153c6cb918dd357f71824ec59dd0d74dfba subpath: nova type: git nova-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 017c8df602cbe33ae3e70a7125ee94886136e850 + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git openvswitch: @@ -316,17 +316,27 @@ data: type: git openvswitch-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: d0b32ed88ad652d9c2226466a13bac8b28038399 + reference: f08d30df6b871044135534eedf76c8f2760d9923 + subpath: helm-toolkit + type: git + placement: + location: https://opendev.org/openstack/openstack-helm + reference: 2ec17153c6cb918dd357f71824ec59dd0d74dfba + subpath: placement + type: git + placement-htk: + location: https://opendev.org/openstack/openstack-helm-infra + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git rabbitmq: 
location: https://opendev.org/openstack/openstack-helm-infra - reference: 1a8536fd5d9c3c05a0c4b5cd0e6e4a502c9c53bc + reference: 5c8bd68e764b22122d6be4cbda04cfdc76223b23 subpath: rabbitmq type: git rabbitmq-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 832718629f3d967c0bca7f28c53f57cd5ad4ddaa + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git tempest: @@ -352,12 +362,12 @@ data: type: git mariadb: location: https://opendev.org/openstack/openstack-helm-infra - reference: ba601e0cba1bb584fe3bce07f96f8e5b98b12889 + reference: 6dd39da6ad7ffd744ecff423e99637aadd9c0414 subpath: mariadb type: git mariadb-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: a4568f31e2e9d09c8f318a9d938c9a16f0da59ef + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git mini-mirror: @@ -403,7 +413,7 @@ data: osh_infra: ceph-rgw: location: https://opendev.org/openstack/openstack-helm-infra - reference: 20cf2db961a05285a751b3bc96b8fa4e51e3b412 + reference: eacf93722136636dcfbd2b68c59b71f071ffc085 subpath: ceph-rgw type: git ceph-rgw-htk: @@ -413,17 +423,17 @@ data: type: git elasticsearch: location: https://opendev.org/openstack/openstack-helm-infra - reference: a2c1eea8a982de777fa430efdf188d556630f3f0 + reference: fd4bf572111b75f1a73396c6d3b714259b53a024 subpath: elasticsearch type: git elasticsearch-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: a78ee39dcb9209a4ba6cc87f2989481a9fa63fc1 + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git fluentd: location: https://opendev.org/openstack/openstack-helm-infra - reference: 59164428d305bf72dd67733a184266fd1217c153 + reference: ddd5a74319142b14d42271da6727e76637133869 subpath: fluentd type: git fluentd-htk: @@ -433,22 +443,22 @@ data: type: git grafana: location: https://opendev.org/openstack/openstack-helm-infra - reference: 
128c3f748aee3ae72cccca0ff17a71ac1ed5c2fb + reference: 87e3a02dd558dfca6a9a8f49feb34f47d516cbf7 subpath: grafana type: git grafana-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: a78ee39dcb9209a4ba6cc87f2989481a9fa63fc1 + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git kibana: location: https://opendev.org/openstack/openstack-helm-infra - reference: b62a46336c1b6ca86e48710ba85c9320f3075fd5 + reference: 9a719e2a18bfd4f1daa57d1a4397d89966653b18 subpath: kibana type: git kibana-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: a78ee39dcb9209a4ba6cc87f2989481a9fa63fc1 + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git local-storage: @@ -488,7 +498,7 @@ data: type: git prometheus-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: a78ee39dcb9209a4ba6cc87f2989481a9fa63fc1 + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git prometheus_kube_state_metrics: @@ -549,7 +559,7 @@ data: type: git armada-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 926348fe2476051f9ca825916db333f81c0139b7 + reference: 44947cc80b91510da6f68a434c847af2d260cabd subpath: helm-toolkit type: git barbican: @@ -559,12 +569,12 @@ data: type: git barbican-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: c2ece6a45aea1a4d52942eeba23b5d37de70c082 + reference: 2b20674cad133581e1259ac87470ba0f6cca313b subpath: helm-toolkit type: git ceph-client: location: https://opendev.org/openstack/openstack-helm-infra - reference: dd39a0f7e08c9eee861b9fa23e9587d440b76c43 + reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e subpath: ceph-client type: git ceph-htk: @@ -574,22 +584,22 @@ data: type: git ceph-mon: location: https://opendev.org/openstack/openstack-helm-infra - reference: 4eee89ccba75a34b222d2f828129d0d5f26ffd23 + reference: 
8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e subpath: ceph-mon type: git ceph-osd: location: https://opendev.org/openstack/openstack-helm-infra - reference: 4ed24de14b562607742a246906b48fba647d3ce8 + reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e subpath: ceph-osd type: git ceph-provisioners: location: https://opendev.org/openstack/openstack-helm-infra - reference: 4ed24de14b562607742a246906b48fba647d3ce8 + reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e subpath: ceph-provisioners type: git ceph-rgw: location: https://opendev.org/openstack/openstack-helm-infra - reference: 20cf2db961a05285a751b3bc96b8fa4e51e3b412 + reference: 2f8ea3977ba31a4576ffb9bf98282d0586d1aa25 subpath: ceph-rgw type: git deckhand: @@ -599,7 +609,7 @@ data: type: git deckhand-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 926348fe2476051f9ca825916db333f81c0139b7 + reference: 8b09a074232fd1abff26055fd975ce742bc7d71b subpath: helm-toolkit type: git divingbell: @@ -619,7 +629,7 @@ data: type: git drydock-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 926348fe2476051f9ca825916db333f81c0139b7 + reference: 9061d08a5e41a94fd92e60d860bfa7464d2a3cb5 subpath: helm-toolkit type: git ingress: @@ -634,7 +644,7 @@ data: type: git keystone: location: https://opendev.org/openstack/openstack-helm - reference: 28d0a56e46129276559a4ddb2dea32c35b10b58e + reference: d467d685a3863edc5fed7c352961b3235a5e3a99 subpath: keystone type: git keystone-htk: @@ -649,7 +659,7 @@ data: type: git maas-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: d0f808a64e2b0340aeefcfc4c6107bc825a9fc99 + reference: d96b724310252c259041c216e1c110062e506347 subpath: helm-toolkit type: git mariadb: @@ -659,7 +669,7 @@ data: type: git mariadb-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: f08d30df6b871044135534eedf76c8f2760d9923 + reference: 2dc83fdde7d9a7efe378730e480efbdbdde997db subpath: helm-toolkit type: git 
memcached: @@ -679,12 +689,12 @@ data: type: git postgresql-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 4a770bb90846e7bd5fd32be4fcbce95b4218be01 + reference: 25aa3690252c605d237c187524d0adf73a8424e5 subpath: helm-toolkit type: git promenade: location: https://opendev.org/airship/promenade - reference: 27f181a9d30294030d695b747b2e4560ffbd29be + reference: d161528ae8de0dcb0dd9d39bc370f85f2aa1c462 subpath: charts/promenade type: git promenade-htk: @@ -709,12 +719,12 @@ data: type: git shipyard-htk: location: https://opendev.org/openstack/openstack-helm-infra - reference: 926348fe2476051f9ca825916db333f81c0139b7 + reference: b50fae62a4ad0992ce877cd632800e1eed5f71a9 subpath: helm-toolkit type: git tenant-ceph-client: location: https://opendev.org/openstack/openstack-helm-infra - reference: dd39a0f7e08c9eee861b9fa23e9587d440b76c43 + reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e subpath: ceph-client type: git tenant-ceph-htk: @@ -724,22 +734,22 @@ data: type: git tenant-ceph-mon: location: https://opendev.org/openstack/openstack-helm-infra - reference: 4eee89ccba75a34b222d2f828129d0d5f26ffd23 + reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e subpath: ceph-mon type: git tenant-ceph-osd: location: https://opendev.org/openstack/openstack-helm-infra - reference: 4ed24de14b562607742a246906b48fba647d3ce8 + reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e subpath: ceph-osd type: git tenant-ceph-provisioners: location: https://opendev.org/openstack/openstack-helm-infra - reference: 4ed24de14b562607742a246906b48fba647d3ce8 + reference: 8d9b7fdd2b146dc8a1578d6ee23c79aa3116f87e subpath: ceph-provisioners type: git tenant-ceph-rgw: location: https://opendev.org/openstack/openstack-helm-infra - reference: 20cf2db961a05285a751b3bc96b8fa4e51e3b412 + reference: 2f8ea3977ba31a4576ffb9bf98282d0586d1aa25 subpath: ceph-rgw type: git tiller: @@ -832,11 +842,12 @@ data: busybox: &busybox docker.io/busybox:1.28.3 alpine-38: &alpine-38 
docker.io/alpine:3.8 airflow: &airflow quay.io/airshipit/airflow:f0f876afef07f62cd38fbce8b775cfc741e0bf52-ubuntu_xenial - armada: &armada quay.io/airshipit/armada:7ef4b8643b5ec5216a8f6726841e156c0aa54a1a-ubuntu_bionic + #armada: &armada quay.io/airshipit/armada:7ef4b8643b5ec5216a8f6726841e156c0aa54a1a-ubuntu_bionic + armada: &armada quay.io/airshipit/armada:b37417253f99f23549e09502e3bcd81d450bb4c4-ubuntu_bionic barbican: &barbican docker.io/openstackhelm/barbican@sha256:4c44bb9e5d29224007b2ef52c1ce4ff756e655efe9c6e9a95b2e98f4f501499e #ceph_daemon: &ceph_daemon docker.io/openstackhelm/ceph-daemon:ubuntu_bionic-20191216 - ceph_daemon: &ceph_daemon docker.io/openstackhelm/ceph-daemon:ubuntu_bionic-20210902 + ceph_daemon: &ceph_daemon docker.io/openstackhelm/ceph-daemon:ubuntu_bionic-20200521 ceph-utility: &ceph-utility quay.io/airshipit/porthole-ceph-utility:e7a6644b3af8bddd94d20ca35f388ae605203416-ubuntu_bionic @@ -855,15 +866,15 @@ data: curator: &curator docker.io/bobrik/curator:5.8.1 - deckhand: &deckhand quay.io/airshipit/deckhand:90f653bc0fa9f2c910d05a3c00d2c339c064638d-ubuntu_xenial + deckhand: &deckhand quay.io/airshipit/deckhand:5cd799cc5d04527ac782270008ff647b3779ff05-ubuntu_bionic - dep_check: &dep_check quay.io/stackanetes/kubernetes-entrypoint:v0.3.1 + dep_check: &dep_check quay.io/airshipit/kubernetes-entrypoint:v1.0.0 - drydock: &drydock quay.io/airshipit/drydock:dfe7c0508d27f517bf29cd2f37b7f07b112edb4e + drydock: &drydock quay.io/airshipit/drydock:aa0cf8c8d09ad37b8ebcce677064e1b3b2211758-ubuntu_bionic elasticsearch: &elasticsearch docker.io/openstackhelm/elasticsearch-s3:7_1_0-20191119 - etcd: &etcd quay.io/coreos/etcd:v3.4.8 + etcd: &etcd quay.io/coreos/etcd:v3.4.15 etcdctl: &etcdctl-utility quay.io/airshipit/porthole-etcdctl-utility:e7a6644b3af8bddd94d20ca35f388ae605203416-ubuntu_bionic @@ -889,35 +900,34 @@ data: ingress_error_pages_404: &ingress_error_pages_404 
gcr.io/google-containers/ingress-gce-404-server-with-metrics-amd64:v1.6.0@sha256:d83d8a481145d0eb71f8bd71ae236d1c6a931dd3bdcaf80919a8ec4a4d8aff74 - ingress_controller_mariadb: &ingress_controller_mariadb quay.io/kubernetes-ingress-controller/nginx-ingress-controller:0.32.0 + ingress_controller_mariadb: &ingress_controller_mariadb k8s.gcr.io/ingress-nginx/controller:v0.48.1 k8s-keystone-auth: &k8s-keystone-auth docker.io/k8scloudprovider/k8s-keystone-auth:v1.18.0 - kibana: &kibana docker.elastic.co/kibana/kibana-oss:7.9.2 + kibana: &kibana docker.elastic.co/kibana/kibana-oss:7.1.0 libvirt: &libvirt docker.io/openstackhelm/libvirt:ubuntu_bionic-20210227 - mariadb_db: &mariadb_db docker.io/openstackhelm/mariadb:10.2.18 + mariadb_db: &mariadb_db docker.io/openstackhelm/mariadb:ubuntu_xenial-20200811 - maas_rack_controller: &maas_rack_controller quay.io/airshipit/maas-rack-controller:840b482373df163ba088b91c278f2a58fd599b7b + maas_rack_controller: &maas_rack_controller quay.io/airshipit/maas-rack-controller:94e55069dc17606e0c3b585d7e901ee0bf372f29 - maas_region_controller: &maas_region_controller quay.io/airshipit/maas-region-controller:840b482373df163ba088b91c278f2a58fd599b7b + maas_region_controller: &maas_region_controller quay.io/airshipit/maas-region-controller:94e55069dc17606e0c3b585d7e901ee0bf372f29 maas_ingress: &maas_ingress docker-prod-local.artifactory.mirantis.com/mirantis/kubernetes-ingress-nginx/nginx-ingress-controller-amd64@sha256:fe510f97b02566e21685b7b108422370ca67a8a44099ce7e968a778c0ba06e0b memcached: &memcached docker.io/library/memcached:1.6.6-alpine #mos_cinder: &mos_cinder openstackhelm/cinder:stein-ubuntu_bionic-20200513 mos_cinder: &mos_cinder docker.io/openstackhelm/cinder:train-ubuntu_bionic-20200612 - mos_cinder_storage_init: &mos_cinder_storage_init docker.io/openstackhelm/ceph-config-helper:ubuntu_bionic-20200416 + mos_cinder_storage_init: &mos_cinder_storage_init docker.io/openstackhelm/ceph-config-helper:ubuntu_bionic-20220603 
#mos_glance: &mos_glance openstackhelm/glance:stein-ubuntu_bionic-20200513 mos_glance: &mos_glance docker.io/openstackhelm/glance:train-ubuntu_bionic-20200612 - #mos_heat: &mos_heat docker.io/deepakdt/heat:stein-ubuntu_bionic-taas - mos_heat: &mos_heat docker.io/openstackhelm/heat:train-ubuntu_bionic-20200612 + mos_heat: &mos_heat docker.io/openstackhelm/heat:stein-ubuntu_bionic mos_heat_nova: &mos_heat_nova docker.io/openstackhelm/heat:train-ubuntu_bionic-20200612 - mos_horizon: &mos_horizon docker.io/openstackhelm/horizon:train-ubuntu_bionic-20200612 + mos_horizon: &mos_horizon docker.io/openstackhelm/horizon:train-ubuntu_bionic mos_keystone: &mos_keystone docker.io/openstackhelm/keystone:train-ubuntu_bionic-20200612 #mos_neutron: &mos_neutron docker.io/imarijitbose/stein_neutron_bionic @@ -933,22 +943,25 @@ data: nova_spiceproxy: &nova_spiceproxy docker.io/openstackhelm/nova:train-ubuntu_bionic-20200612 #openvswitch: &openvswitch docker.io/deepakdt/openvswitch:ovs2.11.1-dpdk18.11.3-ubuntu_bionic-dpdk - openvswitch: &openvswitch docker.io/openstackhelm/openvswitch:ubuntu_bionic-20200722 + openvswitch: &openvswitch docker.io/openstackhelm/openvswitch:ubuntu_bionic-dpdk-20220725 openstack-utility: &openstack-utility quay.io/airshipit/porthole-openstack-utility:e7a6644b3af8bddd94d20ca35f388ae605203416-ubuntu_bionic pegleg: &pegleg quay.io/airshipit/pegleg@sha256:0ca3b708c37425e4e05627443dbd39d2ed27cf06193d2cc3bcb5b985b260d79d + + mos_placement: &mos_placement docker.io/openstackhelm/placement:periodic_train-ubuntu_bionic-20220309 + nc-swissknife: &nc-swissknife quay.io/airshipit/pegleg@sha256:0ca3b708c37425e4e05627443dbd39d2ed27cf06193d2cc3bcb5b985b260d79d patroni: &patroni docker-prod-local.artifactory.mirantis.com/nc/patroni:9.6.15-bionic-1567439806207 - postgres: &postgres docker-prod-local.artifactory.mirantis.com/nc/postgresql:9.6.15-debian-1566552796302 + postgres: &postgres docker.io/postgres:9.6 promenade: &promenade 
quay.io/airshipit/promenade:b65930f205b77f28507dee9296aead00e24f2a18 divingbell: &divingbell docker.io/ubuntu:16.04 prometheus: &prometheus docker.io/prom/prometheus:v2.12.0 - prometheus_elasticsearch_exporter: &prometheus_elasticsearch_exporter docker.io/justwatch/elasticsearch_exporter:1.0.1 + prometheus_elasticsearch_exporter: &prometheus_elasticsearch_exporter docker.io/justwatch/elasticsearch_exporter:1.1.0 prometheus_fluentd_exporter: &prometheus_fluentd_exporter docker.io/bitnami/fluentd-exporter:0.2.0 prometheus_memcached_exporter: &prometheus_memcached_exporter docker.io/prom/memcached-exporter:v0.4.1 prometheus_mysql_exporter: &prometheus_mysql_exporter docker.io/prom/mysqld-exporter:v0.10.0 @@ -958,12 +971,12 @@ data: rabbitmq_mgmt: &rabbitmq_mgmt docker.io/library/rabbitmq:3.7.15-management rabbitmq: &rabbitmq docker.io/library/rabbitmq:3.7.15 rabbitmq_exporter: &rabbitmq_exporter docker.io/kbudde/rabbitmq-exporter:v1.0.0-RC7.1 - rally_test: &rally_test docker.io/xrally/xrally-openstack:1.3.0 + rally_test: &rally_test docker.io/xrally/xrally-openstack:2.0.0 #rbd_provisioner: &rbd_provisioner docker.io/openstackhelm/ceph-rbd-provisioner:ubuntu_bionic-20191216 rbd_provisioner: &rbd_provisioner docker.io/openstackhelm/ceph-rbd-provisioner:ubuntu_bionic-20200521 selenium_tests: &selenium_tests docker.io/openstackhelm/osh-selenium:ubuntu_bionic-20191017 shipyard: &shipyard quay.io/airshipit/shipyard:0b29f89d3fc284fe483c58f102574c687034468d-ubuntu_xenial - sstream_cache: &sstream_cache quay.io/airshipit/sstream-cache:03ebbaaca3f38ab49a5993b506761a4abfd19d89 + sstream_cache: &sstream_cache quay.io/airshipit/sstream-cache:3accf71685ed980ed8c5c07fd8c59306c012dcd2 #storage_init: &storage_init docker.io/openstackhelm/ceph-config-helper:ubuntu_bionic-20191216 storage_init: &storage_init docker.io/openstackhelm/ceph-config-helper:ubuntu_bionic-20200521 @@ -985,7 +998,7 @@ data: kubernetes_test: &kubernetes_test docker.io/python:3.6 kubernetes_pause: 
&kubernetes_pause gcr.io/google_containers/pause-amd64:3.1 - grafana: &grafana docker.io/grafana/grafana:6.2.0 + grafana: &grafana docker.io/grafana/grafana:7.3.6 # TODO: Move this under the images_refs.images header for consistency keystone: &ref_keystone @@ -1309,6 +1322,15 @@ data: openvswitch_db_server: *openvswitch openvswitch_vswitchd: *openvswitch dep_check: *dep_check + placement: + bootstrap: *mos_heat + <<: *ref_keystone + db_migrate: *mos_placement + db_drop: *mos_heat + db_init: *mos_heat + dep_check: *dep_check + placement: *mos_placement + placement_db_sync: *mos_placement rabbitmq: prometheus_rabbitmq_exporter: *rabbitmq_exporter prometheus_rabbitmq_exporter_helm_tests: *mos_heat @@ -1722,7 +1744,7 @@ data: - main gpgkey: "" named: - runtime: containerd=1.5.2-0ubuntu1~18.04.2 + runtime: containerd=1.5.5-0ubuntu3~18.04.2 socat: socat unnamed: - bsd-mailx @@ -1744,5 +1766,6 @@ data: # NC release to reboot the nodes after the completion of the Shipyard site-update. In # the MOP update, you should also link to the following wiki page: # https://wiki.web.att.com/display/CCPdev/i40e+Driver+upgrades - location: https://netactuate.dl.sourceforge.net/project/e1000/i40e%20stable/2.12.6/i40e-2.12.6.tar.gz + #location: https://netactuate.dl.sourceforge.net/project/e1000/i40e%20stable/2.12.6/i40e-2.12.6.tar.gz + location: https://sourceforge.net/projects/e1000/files/unsupported/i40e%20unsupported/i40e-2.12.6.3/i40e-2.12.6.3.tar.gz ... diff --git a/type/cruiser/software/charts/ucp/core/scaled-charts.yaml b/type/cruiser/software/charts/ucp/core/scaled-charts.yaml index c565de28f..22682b271 100644 --- a/type/cruiser/software/charts/ucp/core/scaled-charts.yaml +++ b/type/cruiser/software/charts/ucp/core/scaled-charts.yaml @@ -87,5 +87,5 @@ data: values: pod: replicas: - server: 3 + server: 1 ... 
diff --git a/type/cruiser/software/config/endpoints.yaml b/type/cruiser/software/config/endpoints.yaml index d64144f48..18bc2a1b5 100644 --- a/type/cruiser/software/config/endpoints.yaml +++ b/type/cruiser/software/config/endpoints.yaml @@ -285,6 +285,7 @@ data: default: 8088 public: 443 oslo_db: + namespace: openstack hosts: default: mariadb discovery: mariadb-discovery diff --git a/type/cruiser/software/config/service_accounts.yaml b/type/cruiser/software/config/service_accounts.yaml index f704e82c7..7dce22c39 100644 --- a/type/cruiser/software/config/service_accounts.yaml +++ b/type/cruiser/software/config/service_accounts.yaml @@ -32,6 +32,8 @@ metadata: - path: .osh.nova.nova.region_name - path: .osh.nova.test.region_name - path: .osh.nova.placement.region_name + - path: .osh.placement.placement.region_name + - path: .osh.placement.test.region_name - path: .osh.barbican.barbican.region_name - path: .osh.horizon.admin.region_name data: @@ -159,6 +161,25 @@ data: oslo_messaging: neutron: username: neutron-rabbitmq-user + placement: + placement: + role: admin + username: placement + project_name: service + user_domain_name: default + project_domain_name: default + test: + role: admin + username: placement-test + project_name: test + user_domain_name: service + project_domain_name: service + oslo_db: + username: placement + database: placement + oslo_messaging: + placement: + username: placement-rabbitmq-user nova: nova: role: admin @@ -190,6 +211,8 @@ data: oslo_messaging: nova: username: nova-rabbitmq-user + placement: + username: nova-rabbitmq-user horizon: admin: username: admin