mirror of
				https://github.com/prometheus/node_exporter.git
				synced 2025-08-20 18:33:52 -07:00 
			
		
		
		
	Migrated away from deprecated Grafonnet library. This replaces panels using Angular JS which are disabled by default in Grafana 11 and will be unsupported in Grafana 12. Fixes #3046 --------- Signed-off-by: Tom <12222103+critchtionary@users.noreply.github.com>
		
			
				
	
	
		
			481 lines
		
	
	
		
			29 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
			
		
		
	
	
			481 lines
		
	
	
		
			29 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
| local grafana = import 'github.com/grafana/grafonnet/gen/grafonnet-latest/main.libsonnet';
 | |
| local dashboard = grafana.dashboard;
 | |
| local variable = dashboard.variable;
 | |
| local row = grafana.panel.row;
 | |
| local prometheus = grafana.query.prometheus;
 | |
| 
 | |
| local timeSeriesPanel = grafana.panel.timeSeries;
 | |
| local tsOptions = timeSeriesPanel.options;
 | |
| local tsStandardOptions = timeSeriesPanel.standardOptions;
 | |
| local tsQueryOptions = timeSeriesPanel.queryOptions;
 | |
| local tsCustom = timeSeriesPanel.fieldConfig.defaults.custom;
 | |
| local tsLegend = tsOptions.legend;
 | |
| 
 | |
| local c = import '../config.libsonnet';
 | |
| 
 | |
| local datasource = variable.datasource.new(
 | |
|   'datasource', 'prometheus'
 | |
| );
 | |
| 
 | |
| local tsCommonPanelOptions =
 | |
|   variable.query.withDatasourceFromVariable(datasource)
 | |
|   + tsCustom.stacking.withMode('normal')
 | |
|   + tsCustom.withFillOpacity(100)
 | |
|   + tsCustom.withShowPoints('never')
 | |
|   + tsLegend.withShowLegend(false)
 | |
|   + tsOptions.tooltip.withMode('multi')
 | |
|   + tsOptions.tooltip.withSort('desc');
 | |
| 
 | |
| local CPUUtilisation =
 | |
|   timeSeriesPanel.new(
 | |
|     'CPU Utilisation',
 | |
|   )
 | |
|   + tsCommonPanelOptions
 | |
|   + tsStandardOptions.withUnit('percentunit');
 | |
| 
 | |
| local CPUSaturation =
 | |
|   // TODO: Is this a useful panel? At least there should be some explanation how load
 | |
|   // average relates to the "CPU saturation" in the title.
 | |
|   timeSeriesPanel.new(
 | |
|     'CPU Saturation (Load1 per CPU)',
 | |
|   )
 | |
|   + tsCommonPanelOptions
 | |
|   + tsStandardOptions.withUnit('percentunit');
 | |
| 
 | |
| local memoryUtilisation =
 | |
|   timeSeriesPanel.new(
 | |
|     'Memory Utilisation',
 | |
|   )
 | |
|   + tsCommonPanelOptions
 | |
|   + tsStandardOptions.withUnit('percentunit');
 | |
| 
 | |
| local memorySaturation =
 | |
|   timeSeriesPanel.new(
 | |
|     'Memory Saturation (Major Page Faults)',
 | |
|   )
 | |
|   + tsCommonPanelOptions
 | |
|   + tsStandardOptions.withUnit('rds');
 | |
| 
 | |
| local networkOverrides = tsStandardOptions.withOverrides(
 | |
|   [
 | |
|     tsStandardOptions.override.byRegexp.new('/Transmit/')
 | |
|     + tsStandardOptions.override.byRegexp.withPropertiesFromOptions(
 | |
|       tsCustom.withTransform('negative-Y')
 | |
|     ),
 | |
|   ]
 | |
| );
 | |
| 
 | |
| local networkUtilisation =
 | |
|   timeSeriesPanel.new(
 | |
|     'Network Utilisation (Bytes Receive/Transmit)',
 | |
|   )
 | |
|   + tsCommonPanelOptions
 | |
|   + tsStandardOptions.withUnit('Bps')
 | |
|   + networkOverrides;
 | |
| 
 | |
| local networkSaturation =
 | |
|   timeSeriesPanel.new(
 | |
|     'Network Saturation (Drops Receive/Transmit)',
 | |
|   )
 | |
|   + tsCommonPanelOptions
 | |
|   + tsStandardOptions.withUnit('Bps')
 | |
|   + networkOverrides;
 | |
| 
 | |
| local diskIOUtilisation =
 | |
|   timeSeriesPanel.new(
 | |
|     'Disk IO Utilisation',
 | |
|   )
 | |
|   + tsCommonPanelOptions
 | |
|   + tsStandardOptions.withUnit('percentunit');
 | |
| 
 | |
| local diskIOSaturation =
 | |
|   timeSeriesPanel.new(
 | |
|     'Disk IO Saturation',
 | |
|   )
 | |
|   + tsCommonPanelOptions
 | |
|   + tsStandardOptions.withUnit('percentunit');
 | |
| 
 | |
| local diskSpaceUtilisation =
 | |
|   timeSeriesPanel.new(
 | |
|     'Disk Space Utilisation',
 | |
|   )
 | |
|   + tsCommonPanelOptions
 | |
|   + tsStandardOptions.withUnit('percentunit');
 | |
| 
 | |
| {
 | |
|   _clusterVariable::
 | |
|     variable.query.new('cluster')
 | |
|     + variable.query.withDatasourceFromVariable(datasource)
 | |
|     + variable.query.queryTypes.withLabelValues(
 | |
|       $._config.clusterLabel,
 | |
|       'node_time_seconds',
 | |
|     )
 | |
|     + (if $._config.showMultiCluster then variable.query.generalOptions.showOnDashboard.withLabelAndValue() else variable.query.generalOptions.showOnDashboard.withNothing())
 | |
|     + variable.query.refresh.onTime()
 | |
|     + variable.query.selectionOptions.withIncludeAll(false)
 | |
|     + variable.query.withSort(asc=true),
 | |
| 
 | |
|   grafanaDashboards+:: {
 | |
|                          'node-rsrc-use.json':
 | |
|                            dashboard.new(
 | |
|                              '%sUSE Method / Node' % $._config.dashboardNamePrefix,
 | |
|                            )
 | |
|                            + dashboard.time.withFrom('now-1h')
 | |
|                            + dashboard.withTags($._config.dashboardTags)
 | |
|                            + dashboard.withTimezone('utc')
 | |
|                            + dashboard.withRefresh('30s')
 | |
|                            + dashboard.graphTooltip.withSharedCrosshair()
 | |
|                            + dashboard.withUid(std.md5('node-rsrc-use.json'))
 | |
|                            + dashboard.withVariables([
 | |
|                              datasource,
 | |
|                              $._clusterVariable,
 | |
|                              variable.query.new('instance')
 | |
|                              + variable.query.withDatasourceFromVariable(datasource)
 | |
|                              + variable.query.queryTypes.withLabelValues(
 | |
|                                'instance',
 | |
|                                'node_exporter_build_info{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}' % $._config,
 | |
|                              )
 | |
|                              + variable.query.refresh.onTime()
 | |
|                              + variable.query.withSort(asc=true),
 | |
|                            ])
 | |
|                            + dashboard.withPanels(
 | |
|                              grafana.util.grid.makeGrid([
 | |
|                                row.new('CPU')
 | |
|                                + row.withPanels([
 | |
|                                  CPUUtilisation + tsQueryOptions.withTargets([prometheus.new('$datasource', 'instance:node_cpu_utilisation:rate%(rateInterval)s{%(nodeExporterSelector)s, instance="$instance", %(clusterLabel)s="$cluster"} != 0' % $._config) + prometheus.withLegendFormat('Utilisation')]),
 | |
|                                  CPUSaturation + tsQueryOptions.withTargets([prometheus.new('$datasource', 'instance:node_load1_per_cpu:ratio{%(nodeExporterSelector)s, instance="$instance", %(clusterLabel)s="$cluster"} != 0' % $._config) + prometheus.withLegendFormat('Saturation')]),
 | |
|                                ]),
 | |
|                                row.new('Memory')
 | |
|                                + row.withPanels([
 | |
|                                  memoryUtilisation + tsQueryOptions.withTargets([prometheus.new('$datasource', 'instance:node_memory_utilisation:ratio{%(nodeExporterSelector)s, instance="$instance", %(clusterLabel)s="$cluster"} != 0' % $._config) + prometheus.withLegendFormat('Utilisation')]),
 | |
|                                  memorySaturation + tsQueryOptions.withTargets([prometheus.new('$datasource', 'instance:node_vmstat_pgmajfault:rate%(rateInterval)s{%(nodeExporterSelector)s, instance="$instance", %(clusterLabel)s="$cluster"} != 0' % $._config) + prometheus.withLegendFormat('Major page Faults')]),
 | |
|                                ]),
 | |
|                                row.new('Network')
 | |
|                                + row.withPanels([
 | |
|                                  networkUtilisation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new('$datasource', 'instance:node_network_receive_bytes_excluding_lo:rate%(rateInterval)s{%(nodeExporterSelector)s, instance="$instance", %(clusterLabel)s="$cluster"} != 0' % $._config) + prometheus.withLegendFormat('Receive'),
 | |
|                                    prometheus.new('$datasource', 'instance:node_network_transmit_bytes_excluding_lo:rate%(rateInterval)s{%(nodeExporterSelector)s, instance="$instance", %(clusterLabel)s="$cluster"} != 0' % $._config) + prometheus.withLegendFormat('Transmit'),
 | |
|                                  ]),
 | |
|                                  networkSaturation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new('$datasource', 'instance:node_network_receive_drop_excluding_lo:rate%(rateInterval)s{%(nodeExporterSelector)s, instance="$instance", %(clusterLabel)s="$cluster"} != 0' % $._config) + prometheus.withLegendFormat('Receive'),
 | |
|                                    prometheus.new('$datasource', 'instance:node_network_transmit_drop_excluding_lo:rate%(rateInterval)s{%(nodeExporterSelector)s, instance="$instance", %(clusterLabel)s="$cluster"} != 0' % $._config) + prometheus.withLegendFormat('Transmit'),
 | |
|                                  ]),
 | |
|                                ]),
 | |
|                                row.new('Disk IO')
 | |
|                                + row.withPanels([
 | |
|                                  diskIOUtilisation + tsQueryOptions.withTargets([prometheus.new('$datasource', 'instance_device:node_disk_io_time_seconds:rate%(rateInterval)s{%(nodeExporterSelector)s, instance="$instance", %(clusterLabel)s="$cluster"} != 0' % $._config) + prometheus.withLegendFormat('{{device}}')]),
 | |
|                                  diskIOSaturation + tsQueryOptions.withTargets([prometheus.new('$datasource', 'instance_device:node_disk_io_time_weighted_seconds:rate%(rateInterval)s{%(nodeExporterSelector)s, instance="$instance", %(clusterLabel)s="$cluster"} != 0' % $._config) + prometheus.withLegendFormat('{{device}}')]),
 | |
|                                ]),
 | |
|                              ], panelWidth=12, panelHeight=7)
 | |
|                              + grafana.util.grid.makeGrid([
 | |
|                                row.new('Disk Space')
 | |
|                                + row.withPanels([
 | |
|                                  diskSpaceUtilisation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        sort_desc(1 -
 | |
|                                          (
 | |
|                                            max without (mountpoint, fstype) (node_filesystem_avail_bytes{%(nodeExporterSelector)s, fstype!="", instance="$instance", %(clusterLabel)s="$cluster"})
 | |
|                                            /
 | |
|                                            max without (mountpoint, fstype) (node_filesystem_size_bytes{%(nodeExporterSelector)s, fstype!="", instance="$instance", %(clusterLabel)s="$cluster"})
 | |
|                                          ) != 0
 | |
|                                        )
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{device}}'),
 | |
|                                  ]),
 | |
|                                ]),
 | |
|                              ], panelWidth=24, panelHeight=7, startY=34),
 | |
|                            ),
 | |
|                          'node-cluster-rsrc-use.json':
 | |
|                            dashboard.new(
 | |
|                              '%sUSE Method / Cluster' % $._config.dashboardNamePrefix,
 | |
|                            )
 | |
|                            + dashboard.time.withFrom('now-1h')
 | |
|                            + dashboard.withTags($._config.dashboardTags)
 | |
|                            + dashboard.withTimezone('utc')
 | |
|                            + dashboard.withRefresh('30s')
 | |
|                            + dashboard.graphTooltip.withSharedCrosshair()
 | |
|                            + dashboard.withUid(std.md5('node-cluster-rsrc-use.json'))
 | |
|                            + dashboard.withVariables([
 | |
|                              datasource,
 | |
|                              $._clusterVariable,
 | |
|                              variable.query.withDatasourceFromVariable(datasource)
 | |
|                              + variable.query.refresh.onTime()
 | |
|                              + variable.query.withSort(asc=true),
 | |
|                            ])
 | |
|                            + dashboard.withPanels(
 | |
|                              grafana.util.grid.makeGrid([
 | |
|                                row.new('CPU')
 | |
|                                + row.withPanels([
 | |
|                                  CPUUtilisation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        ((
 | |
|                                          instance:node_cpu_utilisation:rate%(rateInterval)s{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}
 | |
|                                          *
 | |
|                                          instance:node_num_cpu:sum{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}
 | |
|                                        ) != 0 )
 | |
|                                        / scalar(sum(instance:node_num_cpu:sum{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}))
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{ instance }}'),
 | |
|                                  ]),
 | |
|                                  CPUSaturation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        (
 | |
|                                          instance:node_load1_per_cpu:ratio{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}
 | |
|                                          / scalar(count(instance:node_load1_per_cpu:ratio{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}))
 | |
|                                        )  != 0
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{ instance }}'),
 | |
|                                  ]),
 | |
|                                ]),
 | |
|                                row.new('Memory')
 | |
|                                + row.withPanels([
 | |
|                                  memoryUtilisation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        (
 | |
|                                          instance:node_memory_utilisation:ratio{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}
 | |
|                                          / scalar(count(instance:node_memory_utilisation:ratio{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}))
 | |
|                                        ) != 0
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{ instance }}'),
 | |
|                                  ]),
 | |
|                                  memorySaturation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      'instance:node_vmstat_pgmajfault:rate%(rateInterval)s{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}' % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{ instance }}'),
 | |
|                                  ]),
 | |
|                                ]),
 | |
|                                row.new('Network')
 | |
|                                + row.withPanels([
 | |
|                                  networkUtilisation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      'instance:node_network_receive_bytes_excluding_lo:rate%(rateInterval)s{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"} != 0' % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{ instance }} Receive'),
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      'instance:node_network_transmit_bytes_excluding_lo:rate%(rateInterval)s{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"} != 0' % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{ instance }} Transmit'),
 | |
|                                  ]),
 | |
|                                  networkSaturation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      'instance:node_network_receive_drop_excluding_lo:rate%(rateInterval)s{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"} != 0' % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{ instance }} Receive'),
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      'instance:node_network_transmit_drop_excluding_lo:rate%(rateInterval)s{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"} != 0' % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{ instance }} Transmit'),
 | |
|                                  ]),
 | |
|                                ]),
 | |
|                                row.new('Disk IO')
 | |
|                                + row.withPanels([
 | |
|                                  diskIOUtilisation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        instance_device:node_disk_io_time_seconds:rate%(rateInterval)s{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}
 | |
|                                        / scalar(count(instance_device:node_disk_io_time_seconds:rate%(rateInterval)s{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}))
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{ instance }} {{device}}'),
 | |
|                                  ]),
 | |
|                                  diskIOSaturation + tsQueryOptions.withTargets([prometheus.new(
 | |
|                                    '$datasource',
 | |
|                                    |||
 | |
|                                      instance_device:node_disk_io_time_weighted_seconds:rate%(rateInterval)s{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}
 | |
|                                      / scalar(count(instance_device:node_disk_io_time_weighted_seconds:rate%(rateInterval)s{%(nodeExporterSelector)s, %(clusterLabel)s="$cluster"}))
 | |
|                                    ||| % $._config
 | |
|                                  ) + prometheus.withLegendFormat('{{ instance }} {{device}}')]),
 | |
|                                ]),
 | |
|                              ], panelWidth=12, panelHeight=7)
 | |
|                              + grafana.util.grid.makeGrid([
 | |
|                                row.new('Disk Space')
 | |
|                                + row.withPanels([
 | |
|                                  diskSpaceUtilisation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        sum without (device) (
 | |
|                                          max without (fstype, mountpoint) ((
 | |
|                                            node_filesystem_size_bytes{%(nodeExporterSelector)s, %(fsSelector)s, %(fsMountpointSelector)s, %(clusterLabel)s="$cluster"}
 | |
|                                            -
 | |
|                                            node_filesystem_avail_bytes{%(nodeExporterSelector)s, %(fsSelector)s, %(fsMountpointSelector)s, %(clusterLabel)s="$cluster"}
 | |
|                                          ) != 0)
 | |
|                                        )
 | |
|                                        / scalar(sum(max without (fstype, mountpoint) (node_filesystem_size_bytes{%(nodeExporterSelector)s, %(fsSelector)s, %(fsMountpointSelector)s, %(clusterLabel)s="$cluster"})))
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{ instance }}'),
 | |
|                                  ]),
 | |
|                                ]),
 | |
|                              ], panelWidth=24, panelHeight=7, startY=34),
 | |
|                            ),
 | |
|                        } +
 | |
|                        if $._config.showMultiCluster then {
 | |
|                          'node-multicluster-rsrc-use.json':
 | |
|                            dashboard.new(
 | |
|                              '%sUSE Method / Multi-cluster' % $._config.dashboardNamePrefix,
 | |
|                            )
 | |
|                            + dashboard.time.withFrom('now-1h')
 | |
|                            + dashboard.withTags($._config.dashboardTags)
 | |
|                            + dashboard.withTimezone('utc')
 | |
|                            + dashboard.withRefresh('30s')
 | |
|                            + dashboard.graphTooltip.withSharedCrosshair()
 | |
|                            + dashboard.withUid(std.md5('node-multicluster-rsrc-use.json'))
 | |
|                            + dashboard.withVariables([
 | |
|                              datasource,
 | |
|                              variable.query.withDatasourceFromVariable(datasource)
 | |
|                              + variable.query.refresh.onTime()
 | |
|                              + variable.query.withSort(asc=true),
 | |
|                            ])
 | |
|                            + dashboard.withPanels(
 | |
|                              grafana.util.grid.makeGrid([
 | |
|                                row.new('CPU')
 | |
|                                + row.withPanels([
 | |
|                                  CPUUtilisation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        sum(
 | |
|                                          ((
 | |
|                                            instance:node_cpu_utilisation:rate%(rateInterval)s{%(nodeExporterSelector)s}
 | |
|                                            *
 | |
|                                            instance:node_num_cpu:sum{%(nodeExporterSelector)s}
 | |
|                                          ) != 0)
 | |
|                                          / scalar(sum(instance:node_num_cpu:sum{%(nodeExporterSelector)s}))
 | |
|                                        ) by (%(clusterLabel)s)
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{%(clusterLabel)s}}'),
 | |
|                                  ]),
 | |
|                                  CPUSaturation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        sum((
 | |
|                                            instance:node_load1_per_cpu:ratio{%(nodeExporterSelector)s}
 | |
|                                            / scalar(count(instance:node_load1_per_cpu:ratio{%(nodeExporterSelector)s}))
 | |
|                                        ) != 0) by (%(clusterLabel)s)
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{%(clusterLabel)s}}'),
 | |
|                                  ]),
 | |
|                                ]),
 | |
|                                row.new('Memory')
 | |
|                                + row.withPanels([
 | |
|                                  memoryUtilisation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        sum((
 | |
|                                            instance:node_memory_utilisation:ratio{%(nodeExporterSelector)s}
 | |
|                                            / scalar(count(instance:node_memory_utilisation:ratio{%(nodeExporterSelector)s}))
 | |
|                                        ) != 0) by (%(clusterLabel)s)
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{%(clusterLabel)s}}'),
 | |
|                                  ]),
 | |
|                                  memorySaturation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        sum((
 | |
|                                            instance:node_vmstat_pgmajfault:rate%(rateInterval)s{%(nodeExporterSelector)s}
 | |
|                                        ) != 0) by (%(clusterLabel)s)
 | |
|                                      |||
 | |
|                                      % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{%(clusterLabel)s}}'),
 | |
|                                  ]),
 | |
|                                ]),
 | |
|                                row.new('Network')
 | |
|                                + row.withPanels([
 | |
|                                  networkUtilisation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        sum((
 | |
|                                            instance:node_network_receive_bytes_excluding_lo:rate%(rateInterval)s{%(nodeExporterSelector)s}
 | |
|                                        ) != 0) by (%(clusterLabel)s)
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{%(clusterLabel)s}} Receive'),
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        sum((
 | |
|                                            instance:node_network_transmit_bytes_excluding_lo:rate%(rateInterval)s{%(nodeExporterSelector)s}
 | |
|                                        ) != 0) by (%(clusterLabel)s)
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{%(clusterLabel)s}} Transmit'),
 | |
|                                  ]),
 | |
|                                  networkSaturation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        sum((
 | |
|                                            instance:node_network_receive_drop_excluding_lo:rate%(rateInterval)s{%(nodeExporterSelector)s}
 | |
|                                        ) != 0) by (%(clusterLabel)s)
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{%(clusterLabel)s}} Receive'),
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        sum((
 | |
|                                            instance:node_network_transmit_drop_excluding_lo:rate%(rateInterval)s{%(nodeExporterSelector)s}
 | |
|                                        ) != 0) by (%(clusterLabel)s)
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{%(clusterLabel)s}} Transmit'),
 | |
|                                  ]),
 | |
|                                ]),
 | |
|                                row.new('Disk IO')
 | |
|                                + row.withPanels([
 | |
|                                  diskIOUtilisation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        sum((
 | |
|                                            instance_device:node_disk_io_time_seconds:rate%(rateInterval)s{%(nodeExporterSelector)s}
 | |
|                                            / scalar(count(instance_device:node_disk_io_time_seconds:rate%(rateInterval)s{%(nodeExporterSelector)s}))
 | |
|                                        ) != 0) by (%(clusterLabel)s, device)
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{%(clusterLabel)s}} {{device}}'),
 | |
|                                  ]),
 | |
|                                  diskIOSaturation + tsQueryOptions.withTargets([prometheus.new(
 | |
|                                    '$datasource',
 | |
|                                    |||
 | |
|                                      sum((
 | |
|                                        instance_device:node_disk_io_time_weighted_seconds:rate%(rateInterval)s{%(nodeExporterSelector)s}
 | |
|                                        / scalar(count(instance_device:node_disk_io_time_weighted_seconds:rate%(rateInterval)s{%(nodeExporterSelector)s}))
 | |
|                                      ) != 0) by (%(clusterLabel)s, device)
 | |
|                                    ||| % $._config
 | |
|                                  ) + prometheus.withLegendFormat('{{%(clusterLabel)s}} {{device}}')]),
 | |
|                                ]),
 | |
| 
 | |
|                              ], panelWidth=12, panelHeight=7)
 | |
|                              + grafana.util.grid.makeGrid([
 | |
|                                row.new('Disk Space')
 | |
|                                + row.withPanels([
 | |
|                                  diskSpaceUtilisation + tsQueryOptions.withTargets([
 | |
|                                    prometheus.new(
 | |
|                                      '$datasource',
 | |
|                                      |||
 | |
|                                        sum (
 | |
|                                          sum without (device) (
 | |
|                                            max without (fstype, mountpoint, instance, pod) ((
 | |
|                                              node_filesystem_size_bytes{%(nodeExporterSelector)s, %(fsSelector)s, %(fsMountpointSelector)s} - node_filesystem_avail_bytes{%(nodeExporterSelector)s, %(fsSelector)s, %(fsMountpointSelector)s}
 | |
|                                            ) != 0)
 | |
|                                          )
 | |
|                                          / scalar(sum(max without (fstype, mountpoint) (node_filesystem_size_bytes{%(nodeExporterSelector)s, %(fsSelector)s, %(fsMountpointSelector)s})))
 | |
|                                        ) by (%(clusterLabel)s)
 | |
|                                      ||| % $._config
 | |
|                                    ) + prometheus.withLegendFormat('{{%(clusterLabel)s}}'),
 | |
|                                  ]),
 | |
|                                ]),
 | |
|                              ], panelWidth=24, panelHeight=7, startY=34),
 | |
|                            ),
 | |
|                        } else {},
 | |
| }
 |