batch-shipyard/heimdall/batch_shipyard_dashboard.json

5268 строки
138 KiB
JSON

{
"__requires": [
{
"type": "grafana",
"id": "grafana",
"name": "Grafana",
"version": "5.1.3"
},
{
"type": "panel",
"id": "graph",
"name": "Graph",
"version": "5.0.0"
},
{
"type": "datasource",
"id": "prometheus",
"name": "Prometheus",
"version": "5.0.0"
},
{
"type": "panel",
"id": "singlestat",
"name": "Singlestat",
"version": "5.0.0"
}
],
"annotations": {
"list": [
{
"builtIn": 1,
"datasource": "-- Grafana --",
"enable": true,
"hide": true,
"iconColor": "rgba(0, 211, 255, 1)",
"limit": 100,
"name": "Annotations & Alerts",
"showIn": 0,
"type": "dashboard"
}
]
},
"description": "Dashboard for Batch Shipyard resources",
"editable": true,
"gnetId": null,
"graphTooltip": 0,
"id": null,
"iteration": 1528233885724,
"links": [],
"panels": [
{
"collapsed": false,
"gridPos": {
"h": 1,
"w": 24,
"x": 0,
"y": 0
},
"id": 286,
"panels": [],
"title": "Aggregate Overview for Resource",
"type": "row"
},
{
"cacheTimeout": null,
"colorBackground": false,
"colorValue": false,
"colors": [
"rgba(245, 54, 54, 0.9)",
"rgba(237, 129, 40, 0.89)",
"rgba(50, 172, 45, 0.97)"
],
"datasource": "Prometheus",
"description": "Total number of nodes",
"format": "short",
"gauge": {
"maxValue": 100,
"minValue": 0,
"show": false,
"thresholdLabels": false,
"thresholdMarkers": true
},
"gridPos": {
"h": 3,
"w": 2,
"x": 0,
"y": 1
},
"id": 289,
"interval": null,
"links": [],
"mappingType": 1,
"mappingTypes": [
{
"name": "value to text",
"value": 1
},
{
"name": "range to text",
"value": 2
}
],
"maxDataPoints": 100,
"minSpan": 4,
"nullPointMode": "null",
"nullText": null,
"postfix": "",
"postfixFontSize": "50%",
"prefix": "",
"prefixFontSize": "50%",
"rangeMaps": [
{
"from": "null",
"text": "N/A",
"to": "null"
}
],
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"lineColor": "rgb(31, 120, 193)",
"show": false
},
"tableColumn": "",
"targets": [
{
"expr": "count(count(node_cpu_seconds_total{job=~\"$job\"}) without (cpu, mode))",
"format": "time_series",
"intervalFactor": 1,
"refId": "B"
}
],
"thresholds": "",
"title": "Nodes",
"type": "singlestat",
"valueFontSize": "50%",
"valueMaps": [
{
"op": "=",
"text": "N/A",
"value": "null"
}
],
"valueName": "current"
},
{
"cacheTimeout": null,
"colorBackground": false,
"colorValue": false,
"colors": [
"rgba(245, 54, 54, 0.9)",
"rgba(237, 129, 40, 0.89)",
"rgba(50, 172, 45, 0.97)"
],
"datasource": "Prometheus",
"decimals": 1,
"description": "System uptime",
"format": "s",
"gauge": {
"maxValue": 100,
"minValue": 0,
"show": false,
"thresholdLabels": false,
"thresholdMarkers": true
},
"gridPos": {
"h": 2,
"w": 4,
"x": 2,
"y": 1
},
"hideTimeOverride": true,
"id": 290,
"interval": null,
"links": [],
"mappingType": 1,
"mappingTypes": [
{
"name": "value to text",
"value": 1
},
{
"name": "range to text",
"value": 2
}
],
"maxDataPoints": 100,
"nullPointMode": "null",
"nullText": null,
"postfix": "s",
"postfixFontSize": "50%",
"prefix": "",
"prefixFontSize": "50%",
"rangeMaps": [
{
"from": "null",
"text": "N/A",
"to": "null"
}
],
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"lineColor": "rgb(31, 120, 193)",
"show": false
},
"tableColumn": "",
"targets": [
{
"expr": "avg(node_time_seconds{job=~\"$job\"}) - avg(node_boot_time_seconds{job=~\"$job\"})",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"refId": "A",
"step": 1800
}
],
"thresholds": "",
"title": "Average Uptime",
"transparent": false,
"type": "singlestat",
"valueFontSize": "50%",
"valueMaps": [
{
"op": "=",
"text": "N/A",
"value": "null"
}
],
"valueName": "current"
},
{
"cacheTimeout": null,
"colorBackground": false,
"colorValue": false,
"colors": [
"rgba(245, 54, 54, 0.9)",
"rgba(237, 129, 40, 0.89)",
"rgba(50, 172, 45, 0.97)"
],
"datasource": "Prometheus",
"decimals": 2,
"description": "Total Memory",
"format": "bytes",
"gauge": {
"maxValue": 100,
"minValue": 0,
"show": false,
"thresholdLabels": false,
"thresholdMarkers": true
},
"gridPos": {
"h": 2,
"w": 4,
"x": 6,
"y": 1
},
"id": 288,
"interval": null,
"links": [],
"mappingType": 1,
"mappingTypes": [
{
"name": "value to text",
"value": 1
},
{
"name": "range to text",
"value": 2
}
],
"maxDataPoints": 100,
"minSpan": 4,
"nullPointMode": "null",
"nullText": null,
"postfix": "",
"postfixFontSize": "70%",
"prefix": "",
"prefixFontSize": "50%",
"rangeMaps": [
{
"from": "null",
"text": "N/A",
"to": "null"
}
],
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"lineColor": "rgb(31, 120, 193)",
"show": false
},
"tableColumn": "",
"targets": [
{
"expr": "sum(node_memory_MemTotal_bytes{job=~\"$job\"})",
"format": "time_series",
"hide": false,
"intervalFactor": 1,
"refId": "A",
"step": 900
}
],
"thresholds": "",
"title": "Total Memory",
"type": "singlestat",
"valueFontSize": "50%",
"valueMaps": [
{
"op": "=",
"text": "N/A",
"value": "null"
}
],
"valueName": "current"
},
{
"aliasColors": {
"Recv_bytes_eth2": "#7EB26D",
"Recv_bytes_lo": "#0A50A1",
"Recv_drop_eth2": "#6ED0E0",
"Recv_drop_lo": "#E0F9D7",
"Recv_errs_eth2": "#BF1B00",
"Recv_errs_lo": "#CCA300",
"Trans_bytes_eth2": "#7EB26D",
"Trans_bytes_lo": "#0A50A1",
"Trans_drop_eth2": "#6ED0E0",
"Trans_drop_lo": "#E0F9D7",
"Trans_errs_eth2": "#BF1B00",
"Trans_errs_lo": "#CCA300",
"recv_bytes_lo": "#0A50A1",
"recv_drop_eth0": "#99440A",
"recv_drop_lo": "#967302",
"recv_errs_eth0": "#BF1B00",
"recv_errs_lo": "#890F02",
"trans_bytes_eth0": "#7EB26D",
"trans_bytes_lo": "#0A50A1",
"trans_drop_eth0": "#99440A",
"trans_drop_lo": "#967302",
"trans_errs_eth0": "#BF1B00",
"trans_errs_lo": "#890F02"
},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"description": "Aggregate Network traffic on all devices",
"fill": 4,
"gridPos": {
"h": 6,
"w": 6,
"x": 10,
"y": 1
},
"id": 300,
"legend": {
"alignAsTable": false,
"avg": false,
"current": false,
"hideEmpty": false,
"hideZero": false,
"max": false,
"min": false,
"rightSide": false,
"show": false,
"sort": "current",
"sortDesc": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "/.*trans.*/",
"transform": "negative-Y"
}
],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(node_network_receive_bytes_total{job=~\"$job\"}[1m]))",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "receive",
"refId": "A",
"step": 240
},
{
"expr": "sum(rate(node_network_transmit_bytes_total{job=~\"$job\"}[1m]))",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "transmit",
"refId": "B",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Network Traffic",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"transparent": false,
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "bytes",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "pps",
"label": "",
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"cacheTimeout": null,
"colorBackground": false,
"colorValue": false,
"colors": [
"rgba(50, 172, 45, 0.97)",
"rgba(237, 129, 40, 0.89)",
"rgba(245, 54, 54, 0.9)"
],
"datasource": "Prometheus",
"decimals": null,
"description": "Smallest free ephemeral disk space on a node",
"format": "bytes",
"gauge": {
"maxValue": 100,
"minValue": 0,
"show": false,
"thresholdLabels": false,
"thresholdMarkers": true
},
"gridPos": {
"h": 2,
"w": 4,
"x": 16,
"y": 1
},
"id": 293,
"interval": null,
"links": [],
"mappingType": 1,
"mappingTypes": [
{
"name": "value to text",
"value": 1
},
{
"name": "range to text",
"value": 2
}
],
"maxDataPoints": 100,
"minSpan": 4,
"nullPointMode": "null",
"nullText": null,
"postfix": "",
"postfixFontSize": "50%",
"prefix": "",
"prefixFontSize": "50%",
"rangeMaps": [
{
"from": "null",
"text": "N/A",
"to": "null"
}
],
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"lineColor": "rgb(31, 120, 193)",
"show": false
},
"tableColumn": "",
"targets": [
{
"expr": "min(node_filesystem_avail_bytes{device=\"/dev/sdb1\",job=~\"$job\"})",
"format": "time_series",
"hide": false,
"intervalFactor": 1,
"refId": "A",
"step": 900
}
],
"thresholds": "70,90",
"title": "Min Free Ephemeral FS Space",
"type": "singlestat",
"valueFontSize": "50%",
"valueMaps": [
{
"op": "=",
"text": "N/A",
"value": "null"
}
],
"valueName": "current"
},
{
"cacheTimeout": null,
"colorBackground": false,
"colorValue": false,
"colors": [
"rgba(50, 172, 45, 0.97)",
"rgba(237, 129, 40, 0.89)",
"rgba(245, 54, 54, 0.9)"
],
"datasource": "Prometheus",
"decimals": null,
"description": "Smallest free root disk space on a node",
"format": "bytes",
"gauge": {
"maxValue": 100,
"minValue": 0,
"show": false,
"thresholdLabels": false,
"thresholdMarkers": true
},
"gridPos": {
"h": 2,
"w": 4,
"x": 20,
"y": 1
},
"id": 294,
"interval": null,
"links": [],
"mappingType": 1,
"mappingTypes": [
{
"name": "value to text",
"value": 1
},
{
"name": "range to text",
"value": 2
}
],
"maxDataPoints": 100,
"minSpan": 4,
"nullPointMode": "null",
"nullText": null,
"postfix": "",
"postfixFontSize": "50%",
"prefix": "",
"prefixFontSize": "50%",
"rangeMaps": [
{
"from": "null",
"text": "N/A",
"to": "null"
}
],
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"lineColor": "rgb(31, 120, 193)",
"show": false
},
"tableColumn": "",
"targets": [
{
"expr": "min(node_filesystem_avail_bytes{mountpoint=\"/\",job=~\"$job\"})",
"format": "time_series",
"hide": false,
"intervalFactor": 1,
"refId": "A",
"step": 900
}
],
"thresholds": "70,90",
"title": "Min Free Root FS Space",
"type": "singlestat",
"valueFontSize": "50%",
"valueMaps": [
{
"op": "=",
"text": "N/A",
"value": "null"
}
],
"valueName": "current"
},
{
"cacheTimeout": null,
"colorBackground": false,
"colorValue": true,
"colors": [
"rgba(50, 172, 45, 0.97)",
"rgba(237, 129, 40, 0.89)",
"rgba(245, 54, 54, 0.9)"
],
"datasource": "Prometheus",
"decimals": null,
"description": "Core usage across all nodes",
"format": "percent",
"gauge": {
"maxValue": 100,
"minValue": 0,
"show": true,
"thresholdLabels": false,
"thresholdMarkers": true
},
"gridPos": {
"h": 4,
"w": 4,
"x": 2,
"y": 3
},
"id": 282,
"interval": null,
"links": [],
"mappingType": 1,
"mappingTypes": [
{
"name": "value to text",
"value": 1
},
{
"name": "range to text",
"value": 2
}
],
"maxDataPoints": 100,
"minSpan": 2,
"nullPointMode": "null",
"nullText": null,
"postfix": "",
"postfixFontSize": "50%",
"prefix": "",
"prefixFontSize": "50%",
"rangeMaps": [
{
"from": "null",
"text": "N/A",
"to": "null"
}
],
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"lineColor": "rgb(31, 120, 193)",
"show": true
},
"tableColumn": "",
"targets": [
{
"expr": "100 * (1 - avg(irate(node_cpu_seconds_total{mode=\"idle\",job=~\"$job\"}[1m])))",
"format": "time_series",
"hide": false,
"intervalFactor": 1,
"legendFormat": "",
"refId": "A",
"step": 900
}
],
"thresholds": "85,95",
"title": "CPU Usage",
"type": "singlestat",
"valueFontSize": "80%",
"valueMaps": [
{
"op": "=",
"text": "N/A",
"value": "null"
}
],
"valueName": "current"
},
{
"cacheTimeout": null,
"colorBackground": false,
"colorValue": true,
"colors": [
"rgba(50, 172, 45, 0.97)",
"rgba(237, 129, 40, 0.89)",
"rgba(245, 54, 54, 0.9)"
],
"datasource": "Prometheus",
"decimals": 0,
"description": "Memory Used by all nodes",
"format": "percent",
"gauge": {
"maxValue": 100,
"minValue": 0,
"show": true,
"thresholdLabels": false,
"thresholdMarkers": true
},
"gridPos": {
"h": 4,
"w": 4,
"x": 6,
"y": 3
},
"hideTimeOverride": false,
"id": 16,
"interval": null,
"links": [],
"mappingType": 1,
"mappingTypes": [
{
"name": "value to text",
"value": 1
},
{
"name": "range to text",
"value": 2
}
],
"maxDataPoints": 100,
"minSpan": 4,
"nullPointMode": "null",
"nullText": null,
"postfix": "",
"postfixFontSize": "50%",
"prefix": "",
"prefixFontSize": "50%",
"rangeMaps": [
{
"from": "null",
"text": "N/A",
"to": "null"
}
],
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"lineColor": "rgb(31, 120, 193)",
"show": true
},
"tableColumn": "",
"targets": [
{
"expr": "100 * (sum(node_memory_MemTotal_bytes{job=~\"$job\"}) - sum(node_memory_MemAvailable_bytes{job=~\"$job\"})) / sum(node_memory_MemTotal_bytes{job=~\"$job\"})",
"format": "time_series",
"hide": false,
"intervalFactor": 1,
"refId": "B",
"step": 900
}
],
"thresholds": "80,90",
"title": "Memory Usage",
"type": "singlestat",
"valueFontSize": "80%",
"valueMaps": [],
"valueName": "current"
},
{
"cacheTimeout": null,
"colorBackground": false,
"colorValue": true,
"colors": [
"rgba(50, 172, 45, 0.97)",
"rgba(237, 129, 40, 0.89)",
"rgba(245, 54, 54, 0.9)"
],
"datasource": "Prometheus",
"decimals": null,
"description": "Average used ephemeral FS",
"format": "percent",
"gauge": {
"maxValue": 100,
"minValue": 0,
"show": true,
"thresholdLabels": false,
"thresholdMarkers": true
},
"gridPos": {
"h": 4,
"w": 4,
"x": 16,
"y": 3
},
"id": 291,
"interval": null,
"links": [],
"mappingType": 1,
"mappingTypes": [
{
"name": "value to text",
"value": 1
},
{
"name": "range to text",
"value": 2
}
],
"maxDataPoints": 100,
"minSpan": 4,
"nullPointMode": "null",
"nullText": null,
"postfix": "",
"postfixFontSize": "50%",
"prefix": "",
"prefixFontSize": "50%",
"rangeMaps": [
{
"from": "null",
"text": "N/A",
"to": "null"
}
],
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"lineColor": "rgb(31, 120, 193)",
"show": true
},
"tableColumn": "",
"targets": [
{
"expr": "100 * ((sum(node_filesystem_size_bytes{device=\"/dev/sdb1\",job=~\"$job\"}) - sum(node_filesystem_avail_bytes{device=\"/dev/sdb1\",job=~\"$job\"})) / sum(node_filesystem_size_bytes{device=\"/dev/sdb1\",job=~\"$job\"}))",
"format": "time_series",
"intervalFactor": 1,
"refId": "A",
"step": 900
}
],
"thresholds": "80,90",
"title": "Ephemeral FS Usage",
"type": "singlestat",
"valueFontSize": "80%",
"valueMaps": [
{
"op": "=",
"text": "N/A",
"value": "null"
}
],
"valueName": "current"
},
{
"cacheTimeout": null,
"colorBackground": false,
"colorValue": true,
"colors": [
"rgba(50, 172, 45, 0.97)",
"rgba(237, 129, 40, 0.89)",
"rgba(245, 54, 54, 0.9)"
],
"datasource": "Prometheus",
"decimals": null,
"description": "Average Used Root FS",
"format": "percent",
"gauge": {
"maxValue": 100,
"minValue": 0,
"show": true,
"thresholdLabels": false,
"thresholdMarkers": true
},
"gridPos": {
"h": 4,
"w": 4,
"x": 20,
"y": 3
},
"id": 292,
"interval": null,
"links": [],
"mappingType": 1,
"mappingTypes": [
{
"name": "value to text",
"value": 1
},
{
"name": "range to text",
"value": 2
}
],
"maxDataPoints": 100,
"minSpan": 4,
"nullPointMode": "null",
"nullText": null,
"postfix": "",
"postfixFontSize": "50%",
"prefix": "",
"prefixFontSize": "50%",
"rangeMaps": [
{
"from": "null",
"text": "N/A",
"to": "null"
}
],
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"lineColor": "rgb(31, 120, 193)",
"show": true
},
"tableColumn": "",
"targets": [
{
"expr": "100 * ((sum(node_filesystem_size_bytes{mountpoint=\"/\",job=~\"$job\"}) - sum(node_filesystem_avail_bytes{mountpoint=\"/\",job=~\"$job\"})) / sum(node_filesystem_size_bytes{mountpoint=\"/\",job=~\"$job\"}))",
"format": "time_series",
"hide": false,
"intervalFactor": 1,
"refId": "A",
"step": 900
}
],
"thresholds": "80,90",
"title": "Root FS Usage",
"type": "singlestat",
"valueFontSize": "80%",
"valueMaps": [
{
"op": "=",
"text": "N/A",
"value": "null"
}
],
"valueName": "current"
},
{
"cacheTimeout": null,
"colorBackground": false,
"colorValue": false,
"colors": [
"rgba(245, 54, 54, 0.9)",
"rgba(237, 129, 40, 0.89)",
"rgba(50, 172, 45, 0.97)"
],
"datasource": "Prometheus",
"description": "Total number of CPU cores",
"format": "short",
"gauge": {
"maxValue": 100,
"minValue": 0,
"show": false,
"thresholdLabels": false,
"thresholdMarkers": true
},
"gridPos": {
"h": 3,
"w": 2,
"x": 0,
"y": 4
},
"id": 287,
"interval": null,
"links": [],
"mappingType": 1,
"mappingTypes": [
{
"name": "value to text",
"value": 1
},
{
"name": "range to text",
"value": 2
}
],
"maxDataPoints": 100,
"minSpan": 4,
"nullPointMode": "null",
"nullText": null,
"postfix": "",
"postfixFontSize": "50%",
"prefix": "",
"prefixFontSize": "50%",
"rangeMaps": [
{
"from": "null",
"text": "N/A",
"to": "null"
}
],
"sparkline": {
"fillColor": "rgba(31, 118, 189, 0.18)",
"full": false,
"lineColor": "rgb(31, 120, 193)",
"show": false
},
"tableColumn": "",
"targets": [
{
"expr": "count(count(node_cpu_seconds_total{job=~\"$job\"}) without (mode))",
"format": "time_series",
"hide": false,
"intervalFactor": 1,
"refId": "A",
"step": 900
}
],
"thresholds": "",
"title": "Total Cores",
"type": "singlestat",
"valueFontSize": "50%",
"valueMaps": [
{
"op": "=",
"text": "N/A",
"value": "null"
}
],
"valueName": "current"
},
{
"collapsed": true,
"gridPos": {
"h": 1,
"w": 24,
"x": 0,
"y": 7
},
"id": 298,
"panels": [
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"decimals": 2,
"description": "Core usage for containers",
"editable": true,
"error": false,
"fill": 0,
"grid": {},
"gridPos": {
"h": 13,
"w": 12,
"x": 0,
"y": 32
},
"height": "",
"id": 302,
"isNew": true,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"hideEmpty": false,
"hideZero": false,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sideWidth": null,
"sort": "current",
"sortDesc": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 2,
"links": [],
"nullPointMode": "connected",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(container_cpu_usage_seconds_total{image!=\"\",instance=~\"($node):$port_ca\",job=~\"$job\"}[1m])) by (name, image, job, instance)",
"format": "time_series",
"hide": false,
"interval": "10s",
"intervalFactor": 1,
"legendFormat": "{{name}}: {{image}} ({{job}}: {{instance}})",
"metric": "container_cpu",
"refId": "A",
"step": 10
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Container Core Usage (1m avg)",
"tooltip": {
"msResolution": true,
"shared": true,
"sort": 2,
"value_type": "cumulative"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "none",
"label": "cores",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"decimals": 2,
"description": "Container Memory Usage (Working Set Size)",
"editable": true,
"error": false,
"fill": 0,
"grid": {},
"gridPos": {
"h": 13,
"w": 12,
"x": 12,
"y": 32
},
"height": "200px",
"id": 303,
"isNew": true,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sideWidth": 200,
"sort": null,
"sortDesc": null,
"total": false,
"values": true
},
"lines": true,
"linewidth": 2,
"links": [],
"nullPointMode": "connected",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(container_memory_working_set_bytes{image!=\"\",instance=~\"($node):$port_ca\",job=~\"$job\"}) by (name, image, job, instance)",
"format": "time_series",
"interval": "10s",
"intervalFactor": 1,
"legendFormat": "{{name}}: {{image}} ({{job}}: {{instance}})",
"refId": "C"
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Container Memory Usage (Working Set)",
"tooltip": {
"msResolution": false,
"shared": true,
"sort": 0,
"value_type": "cumulative"
},
"transparent": false,
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "decbytes",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "Bps",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"decimals": 2,
"description": "Container Network I/O",
"editable": true,
"error": false,
"fill": 0,
"grid": {},
"gridPos": {
"h": 13,
"w": 12,
"x": 0,
"y": 45
},
"height": "200px",
"id": 296,
"isNew": true,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sideWidth": 200,
"sort": null,
"sortDesc": null,
"total": false,
"values": true
},
"lines": true,
"linewidth": 2,
"links": [],
"nullPointMode": "connected",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(container_network_receive_bytes_total{image!=\"\",instance=~\"($node):$port_ca\",job=~\"$job\"}[1m])) by (name, image, job, instance)",
"format": "time_series",
"intervalFactor": 1,
"legendFormat": "{{name}}: {{image}} ({{job}}: {{instance}})",
"refId": "C"
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Container Network Receive (1m avg)",
"tooltip": {
"msResolution": false,
"shared": true,
"sort": 0,
"value_type": "cumulative"
},
"transparent": false,
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "Bps",
"label": null,
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "Bps",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"decimals": 2,
"description": "Container Disk Usage",
"editable": true,
"error": false,
"fill": 0,
"grid": {},
"gridPos": {
"h": 13,
"w": 12,
"x": 12,
"y": 45
},
"height": "200px",
"id": 304,
"isNew": true,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": false,
"min": false,
"rightSide": false,
"show": true,
"sideWidth": 200,
"sort": null,
"sortDesc": null,
"total": false,
"values": true
},
"lines": true,
"linewidth": 2,
"links": [],
"nullPointMode": "connected",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(container_fs_usage_bytes{image!=\"\",instance=~\"($node):$port_ca\",job=~\"$job\"}) by (name, image, job, instance)",
"format": "time_series",
"interval": "10s",
"intervalFactor": 1,
"legendFormat": "{{name}}: {{image}} ({{job}}: {{instance}})",
"refId": "C"
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Container Disk Usage",
"tooltip": {
"msResolution": false,
"shared": true,
"sort": 0,
"value_type": "cumulative"
},
"transparent": false,
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "decbytes",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "Bps",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"decimals": 2,
"description": "Container Write Usage",
"editable": true,
"error": false,
"fill": 0,
"grid": {},
"gridPos": {
"h": 12,
"w": 12,
"x": 0,
"y": 58
},
"height": "200px",
"id": 305,
"isNew": true,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": false,
"min": false,
"rightSide": false,
"show": true,
"sideWidth": 200,
"sort": null,
"sortDesc": null,
"total": false,
"values": true
},
"lines": true,
"linewidth": 2,
"links": [],
"nullPointMode": "connected",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(container_fs_writes_bytes_total{image!=\"\",instance=~\"($node):$port_ca\",job=~\"$job\"}) by (name, image, job, instance)",
"format": "time_series",
"interval": "10s",
"intervalFactor": 1,
"legendFormat": "{{name}}: {{image}} ({{job}}: {{instance}})",
"refId": "C"
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Container Aggregate Write (cumulative)",
"tooltip": {
"msResolution": false,
"shared": true,
"sort": 0,
"value_type": "cumulative"
},
"transparent": false,
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "decbytes",
"label": null,
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"decimals": null,
"format": "none",
"label": "",
"logBase": 1,
"max": null,
"min": null,
"show": true
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"decimals": 2,
"description": "Container Read Usage",
"editable": true,
"error": false,
"fill": 0,
"grid": {},
"gridPos": {
"h": 12,
"w": 12,
"x": 12,
"y": 58
},
"height": "200px",
"id": 306,
"isNew": true,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": false,
"min": false,
"rightSide": false,
"show": true,
"sideWidth": 200,
"sort": null,
"sortDesc": null,
"total": false,
"values": true
},
"lines": true,
"linewidth": 2,
"links": [],
"nullPointMode": "connected",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(container_fs_reads_bytes_total{image!=\"\",instance=~\"($node):$port_ca\",job=~\"$job\"}) by (name, image, job, instance)",
"format": "time_series",
"interval": "10s",
"intervalFactor": 1,
"legendFormat": "{{name}}: {{image}} ({{job}}: {{instance}})",
"refId": "C"
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Container Aggregate Read (cumulative)",
"tooltip": {
"msResolution": false,
"shared": true,
"sort": 0,
"value_type": "cumulative"
},
"transparent": false,
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "decbytes",
"label": null,
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"decimals": null,
"format": "none",
"label": "",
"logBase": 1,
"max": null,
"min": null,
"show": true
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
}
],
"title": "Container Metrics",
"type": "row"
},
{
"collapsed": true,
"gridPos": {
"h": 1,
"w": 24,
"x": 0,
"y": 8
},
"id": 263,
"panels": [
{
"aliasColors": {
"Idle - Waiting for something to happen": "#052B51",
"guest": "#9AC48A",
"idle": "#052B51",
"iowait": "#EAB839",
"irq": "#BF1B00",
"nice": "#C15C17",
"softirq": "#E24D42",
"steal": "#FCE2DE",
"system": "#508642",
"user": "#5195CE"
},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"decimals": 2,
"description": "",
"fill": 4,
"gridPos": {
"h": 12,
"w": 12,
"x": 0,
"y": 9
},
"id": 3,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sideWidth": 250,
"sort": null,
"sortDesc": null,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 4,
"nullPointMode": "null",
"percentage": true,
"pointradius": 5,
"points": false,
"renderer": "flot",
"repeat": null,
"seriesOverrides": [],
"spaceLength": 10,
"stack": true,
"steppedLine": false,
"targets": [
{
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode=\"system\",instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
"format": "time_series",
"interval": "10s",
"intervalFactor": 2,
"legendFormat": "System - Processes executing in kernel mode",
"refId": "A",
"step": 20
},
{
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='user',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "User - Normal processes executing in user mode",
"refId": "B",
"step": 240
},
{
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='nice',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Nice - Niced processes executing in user mode",
"refId": "C",
"step": 240
},
{
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='idle',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Idle - Waiting for something to happen",
"refId": "F",
"step": 240
},
{
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='iowait',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Iowait - Waiting for I/O to complete",
"refId": "D",
"step": 240
},
{
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='irq',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Irq - Servicing interrupts",
"refId": "G",
"step": 240
},
{
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='softirq',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Softirq - Servicing softirqs",
"refId": "H",
"step": 240
},
{
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='steal',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Steal - Time spent in other operating systems when running in a virtualized environment",
"refId": "E",
"step": 240
},
{
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='guest',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Guest - Time spent running a virtual CPU for a guest operating system",
"refId": "I",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "CPU",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"transparent": false,
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Percentage",
"logBase": 1,
"max": "100",
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {
"Apps": "#629E51",
"Buffers": "#614D93",
"Cache": "#6D1F62",
"Cached": "#511749",
"Committed": "#508642",
"Free": "#0A437C",
"Hardware Corrupted - Amount of RAM that the kernel identified as corrupted / not working": "#CFFAFF",
"Inactive": "#584477",
"PageTables": "#0A50A1",
"Page_Tables": "#0A50A1",
"RAM_Free": "#E0F9D7",
"Slab": "#806EB7",
"Slab_Cache": "#E0752D",
"Swap": "#BF1B00",
"Swap - Swap space used": "#BF1B00",
"Swap_Cache": "#C15C17",
"Swap_Free": "#2F575E",
"Unused": "#EAB839",
"Unused - Free memory unassigned": "#052B51"
},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"decimals": 2,
"description": "",
"fill": 4,
"gridPos": {
"h": 12,
"w": 12,
"x": 12,
"y": 9
},
"id": 24,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sideWidth": 350,
"sort": null,
"sortDesc": null,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 4,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "/.*Hardware Corrupted - .*/",
"stack": false
}
],
"spaceLength": 10,
"stack": true,
"steppedLine": false,
"targets": [
{
"expr": "node_memory_MemTotal_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_MemFree_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_Buffers_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_Cached_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_Slab_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_PageTables_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_SwapCached_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "Apps - Memory used by user-space applications",
"refId": "Q",
"step": 240
},
{
"expr": "node_memory_PageTables_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "PageTables - Memory used to map between virtual and physical memory addresses",
"refId": "G",
"step": 240
},
{
"expr": "node_memory_SwapCached_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "SwapCache - Memory that keeps track of pages that have been fetched from swap but not yet been modified",
"refId": "F",
"step": 240
},
{
"expr": "node_memory_Slab_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "Slab - Memory used by the kernel to cache data structures for its own use (caches like inode, dentry, etc)",
"refId": "E",
"step": 240
},
{
"expr": "node_memory_Cached_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "Cache - Parked file data (file content) cache",
"refId": "C",
"step": 240
},
{
"expr": "node_memory_Buffers_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "Buffers - Block device (e.g. harddisk) cache",
"refId": "B",
"step": 240
},
{
"expr": "node_memory_MemFree_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "Unused - Free memory unassigned",
"refId": "D",
"step": 240
},
{
"expr": "(node_memory_SwapTotal_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_SwapFree_bytes{instance=~\"($node):$port\",job=~\"$job\"})",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "Swap - Swap space used",
"refId": "I",
"step": 240
},
{
"expr": "node_memory_HardwareCorrupted_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "Hardware Corrupted - Amount of RAM that the kernel identified as corrupted / not working",
"refId": "O",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Memory Stack",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "bytes",
"label": "Bytes",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {
"receive_packets_eth0": "#7EB26D",
"receive_packets_lo": "#E24D42",
"transmit_packets_eth0": "#7EB26D",
"transmit_packets_lo": "#E24D42"
},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 4,
"gridPos": {
"h": 12,
"w": 12,
"x": 0,
"y": 21
},
"id": 84,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "/.*Trans.*/",
"transform": "negative-Y"
},
{
"alias": "/.*lo.*/",
"color": "#7EB26D"
},
{
"alias": "/.*eth0.*/",
"color": "#EAB839"
},
{
"alias": "/.*eth1.*/",
"color": "#6ED0E0"
},
{
"alias": "/.*eth2.*/",
"color": "#EF843C"
},
{
"alias": "/.*eth3.*/",
"color": "#E24D42"
},
{
"alias": "/.*eth4.*/",
"color": "#1F78C1"
},
{
"alias": "/.*eth5.*/",
"color": "#BA43A9"
}
],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "irate(node_network_receive_bytes_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{device}} - Receive",
"refId": "O",
"step": 240
},
{
"expr": "irate(node_network_transmit_bytes_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{device}} - Transmit",
"refId": "P",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Network Traffic",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "Bps",
"label": "Bytes out (-) / in (+)",
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
}
],
"repeat": null,
"title": "CPU/Memory/Network Detailed Overview",
"type": "row"
},
{
"collapsed": true,
"gridPos": {
"h": 1,
"w": 24,
"x": 0,
"y": 9
},
"id": 271,
"panels": [
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"decimals": 3,
"description": "",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 10
},
"id": 43,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 4,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_filesystem_avail_bytes{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'}",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "{{mountpoint}} - Available",
"metric": "",
"refId": "A",
"step": 4
},
{
"expr": "node_filesystem_free_bytes{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'}",
"format": "time_series",
"hide": true,
"intervalFactor": 2,
"legendFormat": "{{mountpoint}} - Free",
"refId": "B",
"step": 2
},
{
"expr": "node_filesystem_size_bytes{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'}",
"format": "time_series",
"hide": true,
"intervalFactor": 2,
"legendFormat": "{{mountpoint}} - Size",
"refId": "D",
"step": 2
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Filesystem space available",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "bytes",
"label": "Bytes",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"description": "",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 10
},
"id": 41,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"hideZero": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_filesystem_files_free{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'}",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "{{mountpoint}} - Free file nodes",
"refId": "B",
"step": 4
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "File Nodes Free",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "File Nodes",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"description": "",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 20
},
"id": 28,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 4,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_filefd_maximum{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 4,
"legendFormat": "Max open files",
"refId": "A",
"step": 8
},
{
"expr": "node_filefd_allocated{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Open files",
"refId": "B",
"step": 4
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "File Descriptor",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Files",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"description": "",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 20
},
"id": 219,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"hideZero": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_filesystem_files{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'}",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "{{mountpoint}} - File nodes total",
"refId": "A",
"step": 4
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "File Nodes Size",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "File Nodes",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
}
],
"repeat": null,
"title": "Filesystem Metrics",
"type": "row"
},
{
"collapsed": true,
"gridPos": {
"h": 1,
"w": 24,
"x": 0,
"y": 10
},
"id": 265,
"panels": [
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"decimals": 3,
"description": "",
"fill": 4,
"gridPos": {
"h": 12,
"w": 12,
"x": 0,
"y": 9
},
"height": "",
"id": 156,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sort": "current",
"sortDesc": false,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 4,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_filesystem_size_bytes{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'} - node_filesystem_avail_bytes{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{mountpoint}}",
"refId": "A",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Disk Space Used",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "bytes",
"label": "Bytes",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {
"io time": "#890F02"
},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"decimals": 3,
"description": "",
"fill": 4,
"gridPos": {
"h": 12,
"w": 12,
"x": 12,
"y": 9
},
"id": 42,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sort": null,
"sortDesc": null,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 4,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "/.*read.*/",
"transform": "negative-Y"
},
{
"alias": "/.*sda.*/",
"color": "#7EB26D"
},
{
"alias": "/.*sdb.*/",
"color": "#EAB839"
},
{
"alias": "/.*sdc.*/",
"color": "#6ED0E0"
},
{
"alias": "/.*sdd.*/",
"color": "#EF843C"
},
{
"alias": "/.*sde.*/",
"color": "#E24D42"
}
],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "irate(node_disk_read_bytes_total{instance=~\"($node):$port\",job=~\"$job\",device=~\"[a-z]*[a-z]\"}[5m])",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "{{device}} - Successfully read bytes",
"refId": "A",
"step": 240
},
{
"expr": "irate(node_disk_written_bytes_total{instance=~\"($node):$port\",job=~\"$job\",device=~\"[a-z]*[a-z]\"}[5m])",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "{{device}} - Successfully written bytes",
"refId": "B",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "I/O Usage Read / Write",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": false,
"values": []
},
"yaxes": [
{
"format": "Bps",
"label": "Bytes read (-) / write (+)",
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "ms",
"label": "",
"logBase": 1,
"max": null,
"min": null,
"show": true
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"description": "",
"fill": 2,
"gridPos": {
"h": 12,
"w": 12,
"x": 0,
"y": 21
},
"id": 229,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"hideZero": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 4,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "/.*Read.*/",
"transform": "negative-Y"
},
{
"alias": "/.*sda - .*/",
"color": "#7EB26D"
},
{
"alias": "/.*sdb - .*/",
"color": "#EAB839"
},
{
"alias": "/.*sdc - .*/",
"color": "#6ED0E0"
},
{
"alias": "/.*sdd - .*/",
"color": "#EF843C"
},
{
"alias": "/.*sde - .*/",
"color": "#E24D42"
},
{
"alias": "/.*sda1.*/",
"color": "#584477"
},
{
"alias": "/.*sda2.*/",
"color": "#BA43A9"
},
{
"alias": "/.*sda3.*/",
"color": "#F4D598"
},
{
"alias": "/.*sdb1.*/",
"color": "#0A50A1"
},
{
"alias": "/.*sdb2.*/",
"color": "#BF1B00"
},
{
"alias": "/.*sdb3.*/",
"color": "#E0752D"
},
{
"alias": "/.*sdc1.*/",
"color": "#962D82"
},
{
"alias": "/.*sdc2.*/",
"color": "#614D93"
},
{
"alias": "/.*sdc3.*/",
"color": "#9AC48A"
},
{
"alias": "/.*sdd1.*/",
"color": "#65C5DB"
},
{
"alias": "/.*sdd2.*/",
"color": "#F9934E"
},
{
"alias": "/.*sdd3.*/",
"color": "#EA6460"
},
{
"alias": "/.*sde1.*/",
"color": "#E0F9D7"
},
{
"alias": "/.*sde2.*/",
"color": "#FCEACA"
},
{
"alias": "/.*sde3.*/",
"color": "#F9E2D2"
}
],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "irate(node_disk_reads_completed_total{instance=~\"($node):$port\",job=~\"$job\",device=~\"[a-z]*[a-z]\"}[5m])",
"format": "time_series",
"intervalFactor": 4,
"legendFormat": "{{device}} - Reads completed",
"refId": "A",
"step": 480
},
{
"expr": "irate(node_disk_writes_completed_total{instance=~\"($node):$port\",job=~\"$job\",device=~\"[a-z]*[a-z]\"}[5m])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{device}} - Writes completed",
"refId": "B",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Disk IOps",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "iops",
"label": "IO read (-) / write (+)",
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {
"io time": "#890F02"
},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"decimals": 3,
"description": "",
"fill": 4,
"gridPos": {
"h": 12,
"w": 12,
"x": 12,
"y": 21
},
"id": 127,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sort": null,
"sortDesc": null,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 4,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "irate(node_disk_io_time_seconds_total{instance=~\"($node):$port\",job=~\"$job\",device=~\"[a-z]*[a-z]\"}[5m]) * 1000",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "{{device}} - Milliseconds spent doing I/Os",
"refId": "C",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "I/O Usage Times",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": false,
"values": []
},
"yaxes": [
{
"format": "ms",
"label": "Milliseconds",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "ms",
"label": "",
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
}
],
"repeat": null,
"title": "Disk Metrics",
"type": "row"
},
{
"collapsed": true,
"gridPos": {
"h": 1,
"w": 24,
"x": 0,
"y": 11
},
"id": 272,
"panels": [
{
"aliasColors": {
"receive_packets_eth0": "#7EB26D",
"receive_packets_lo": "#E24D42",
"transmit_packets_eth0": "#7EB26D",
"transmit_packets_lo": "#E24D42"
},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 12
},
"id": 60,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sideWidth": 300,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "/.*Trans.*/",
"transform": "negative-Y"
},
{
"alias": "/.*lo.*/",
"color": "#7EB26D"
},
{
"alias": "/.*eth0.*/",
"color": "#EAB839"
},
{
"alias": "/.*eth1.*/",
"color": "#6ED0E0"
},
{
"alias": "/.*eth2.*/",
"color": "#EF843C"
},
{
"alias": "/.*eth3.*/",
"color": "#E24D42"
},
{
"alias": "/.*eth4.*/",
"color": "#1F78C1"
},
{
"alias": "/.*eth5.*/",
"color": "#BA43A9"
}
],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "irate(node_network_receive_packets_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{device}} - Receive",
"refId": "O",
"step": 4
},
{
"expr": "irate(node_network_transmit_packets_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{device}} - Transmit",
"refId": "P",
"step": 4
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Network Traffic by Packets",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "pps",
"label": "Packets out (-) / in (+)",
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 12
},
"id": 142,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"hideEmpty": false,
"hideZero": false,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sideWidth": 300,
"sort": "current",
"sortDesc": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "/.*Trans.*/",
"transform": "negative-Y"
},
{
"alias": "/.*lo.*.errors.*/",
"color": "#7EB26D"
},
{
"alias": "/.*eth0.*.errors.*/",
"color": "#EAB839"
},
{
"alias": "/.*eth1.*.errors.*/",
"color": "#6ED0E0"
},
{
"alias": "/.*eth2.*.errors.*/",
"color": "#EF843C"
},
{
"alias": "/.*eth3.*.errors.*/",
"color": "#E24D42"
},
{
"alias": "/.*eth4.*.errors.*/",
"color": "#1F78C1"
},
{
"alias": "/.*eth5.*.errors.*/",
"color": "#BA43A9"
}
],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "irate(node_network_receive_errs_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{device}} - Receive errors",
"refId": "E",
"step": 4
},
{
"expr": "irate(node_network_transmit_errs_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{device}} - Transmit errors",
"refId": "F",
"step": 4
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Network Traffic Errors",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "pps",
"label": "Packets out (-) / in (+)",
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 22
},
"id": 143,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"hideEmpty": false,
"hideZero": false,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sideWidth": 300,
"sort": "current",
"sortDesc": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "/.*Trans.*/",
"transform": "negative-Y"
},
{
"alias": "/.*lo.*.drop.*/",
"color": "#7EB26D"
},
{
"alias": "/.*eth0.*.drop.*/",
"color": "#EAB839"
},
{
"alias": "/.*eth1.*.drop.*/",
"color": "#6ED0E0"
},
{
"alias": "/.*eth2.*.drop.*/",
"color": "#EF843C"
},
{
"alias": "/.*eth3.*.drop.*/",
"color": "#E24D42"
},
{
"alias": "/.*eth4.*.drop.*/",
"color": "#1F78C1"
},
{
"alias": "/.*eth5.*.drop.*/",
"color": "#BA43A9"
}
],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "irate(node_network_receive_drop_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{device}} - Receive drop",
"refId": "G",
"step": 4
},
{
"expr": "irate(node_network_transmit_drop_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{device}} - Transmit drop",
"refId": "H",
"step": 4
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Network Traffic Drop",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "pps",
"label": "Packets out (-) / in (+)",
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 22
},
"id": 61,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "NF conntrack limit",
"color": "#890F02",
"fill": 0
}
],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_nf_conntrack_entries{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "NF conntrack entries",
"refId": "O",
"step": 4
},
{
"expr": "node_nf_conntrack_entries_limit{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "NF conntrack limit",
"refId": "P",
"step": 4
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "NF Conntrack",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Entries",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 32
},
"id": 63,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"hideEmpty": false,
"hideZero": false,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sideWidth": 300,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_sockstat_TCP_alloc{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "TCP_alloc - Allocated sockets",
"refId": "D",
"step": 240
},
{
"expr": "node_sockstat_TCP_inuse{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "TCP_inuse - Tcp sockets currently in use",
"refId": "E",
"step": 240
},
{
"expr": "node_sockstat_TCP_mem{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "TCP_mem - Used memory for tcp",
"refId": "F",
"step": 240
},
{
"expr": "node_sockstat_TCP_orphan{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "TCP_orphan - Orphan sockets",
"refId": "H",
"step": 240
},
{
"expr": "node_sockstat_TCP_tw{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "TCP_tw - Sockets waiting close",
"refId": "I",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Sockstat TCP",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Sockets",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 32
},
"id": 124,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"hideEmpty": false,
"hideZero": false,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sideWidth": 300,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_sockstat_UDPLITE_inuse{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "UDPLITE_inuse - Udplite sockets currently in use",
"refId": "J",
"step": 240
},
{
"expr": "node_sockstat_UDP_inuse{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "UDP_inuse - Udp sockets currently in use",
"refId": "K",
"step": 240
},
{
"expr": "node_sockstat_UDP_mem{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "UDP_mem - Used memory for udp",
"refId": "L",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Sockstat UDP",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Sockets",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 42
},
"id": 126,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"hideEmpty": false,
"hideZero": false,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sideWidth": 300,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_sockstat_sockets_used{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Sockets_used - Sockets currently in use",
"refId": "N",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Sockstat Used",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Sockets",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 42
},
"id": 220,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"hideEmpty": false,
"hideZero": false,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sideWidth": 300,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_sockstat_TCP_mem_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "TCP_mem_bytes - ",
"refId": "G",
"step": 240
},
{
"expr": "node_sockstat_UDP_mem_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "UDP_mem_bytes - ",
"refId": "A",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Sockstat Memory Size",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "bytes",
"label": "Bytes",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
}
],
"repeat": null,
"title": "Network Detailed Metrics",
"type": "row"
},
{
"collapsed": true,
"gridPos": {
"h": 1,
"w": 24,
"x": 0,
"y": 12
},
"id": 269,
"panels": [
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 13
},
"id": 7,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 4,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"repeat": null,
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_load1{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 4,
"legendFormat": "Load 1m",
"refId": "A",
"step": 480
},
{
"expr": "node_load5{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 4,
"legendFormat": "Load 5m",
"refId": "B",
"step": 480
},
{
"expr": "node_load15{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 4,
"legendFormat": "Load 15m",
"refId": "C",
"step": 480
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "System Load",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Load",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 13
},
"id": 62,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 4,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_procs_blocked{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Processes blocked waiting for I/O to complete",
"refId": "A",
"step": 240
},
{
"expr": "node_procs_running{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Processes in runnable state",
"refId": "B",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Processes State",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Processes",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 23
},
"id": 149,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "process_virtual_memory_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
"interval": "",
"intervalFactor": 2,
"legendFormat": "Processes virtual memory size in bytes",
"refId": "C",
"step": 240
},
{
"expr": "process_resident_memory_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
"interval": "",
"intervalFactor": 2,
"legendFormat": "Processes resident memory size in bytes",
"refId": "A",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Processes Memory",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "decbytes",
"label": "Bytes",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 23
},
"id": 64,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "/.*Max*./",
"color": "#890F02",
"fill": 0
}
],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "process_max_fds{instance=~\"($node):$port\",job=~\"$job\"}",
"interval": "",
"intervalFactor": 2,
"legendFormat": "Maximum open file descriptors",
"refId": "A",
"step": 240
},
{
"expr": "process_open_fds{instance=~\"($node):$port\",job=~\"$job\"}",
"interval": "",
"intervalFactor": 2,
"legendFormat": "Open file descriptors",
"refId": "B",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "File Descriptors",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Descriptors",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 33
},
"id": 8,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 4,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"repeat": null,
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "irate(node_context_switches_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Context switches",
"refId": "A",
"step": 240
},
{
"expr": "irate(node_intr_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Interrupts",
"refId": "B",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Context Switches / Interrupts",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Counter",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 33
},
"id": 148,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 4,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "rate(node_forks_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
"format": "time_series",
"hide": false,
"intervalFactor": 2,
"legendFormat": "Processes forks second",
"refId": "C",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Processes Forks",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Forks / sec",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"description": "",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 43
},
"id": 260,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "/.*Variation*./",
"color": "#890F02"
}
],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_timex_estimated_error_seconds{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"hide": false,
"interval": "",
"intervalFactor": 2,
"legendFormat": "Estimated error in seconds",
"refId": "B",
"step": 240
},
{
"expr": "node_timex_offset_seconds{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"hide": false,
"interval": "",
"intervalFactor": 2,
"legendFormat": "Time offset in between local system and reference clock",
"refId": "A",
"step": 240
},
{
"expr": "node_timex_maxerror_seconds{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"hide": false,
"interval": "",
"intervalFactor": 2,
"legendFormat": "Maximum error in seconds",
"refId": "C",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "Time Syncronized Drift",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "s",
"label": "Seconds",
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
}
],
"repeat": null,
"title": "System Metrics",
"type": "row"
},
{
"collapsed": true,
"gridPos": {
"h": 1,
"w": 24,
"x": 0,
"y": 13
},
"id": 314,
"panels": [
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 14
},
"height": "",
"id": 316,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"hideZero": false,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sortDesc": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 2,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_mountstats_nfs_transport_connect_total{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"hide": false,
"instant": false,
"interval": "",
"intervalFactor": 1,
"legendFormat": "NFS client connections",
"refId": "C",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "NFS Client Connections",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Connections",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {
"receive_packets_eth0": "#7EB26D",
"receive_packets_lo": "#E24D42",
"transmit_packets_eth0": "#7EB26D",
"transmit_packets_lo": "#E24D42"
},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 3,
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 14
},
"id": 315,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "Read",
"transform": "negative-Y"
}
],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(node_mountstats_nfs_write_bytes_total{instance=~\"($node):$port\",job=~\"$job\"}[1m]))",
"format": "time_series",
"hide": false,
"instant": false,
"interval": "",
"intervalFactor": 1,
"legendFormat": "Write",
"refId": "A",
"step": 240
},
{
"expr": "sum(rate(node_mountstats_nfs_read_bytes_total{instance=~\"($node):$port\",job=~\"$job\"}[1m]))",
"format": "time_series",
"hide": false,
"interval": "",
"intervalFactor": 1,
"legendFormat": "Read",
"refId": "B"
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "NFS Client I/O",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "Bps",
"label": "",
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
}
],
"title": "NFS Client Metrics",
"type": "row"
},
{
"collapsed": true,
"gridPos": {
"h": 1,
"w": 24,
"x": 0,
"y": 14
},
"id": 310,
"panels": [
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 2,
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 15
},
"height": "",
"id": 308,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"hideZero": false,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"sortDesc": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"minSpan": 2,
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_nfsd_connections_total{instance=~\"($node):$port\",job=~\"$job\"}",
"format": "time_series",
"hide": false,
"instant": false,
"interval": "",
"intervalFactor": 1,
"legendFormat": "NFS kernel server connections",
"refId": "C",
"step": 240
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "NFS Kernel Server Connections",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": "Connections",
"logBase": 1,
"max": null,
"min": "0",
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {
"receive_packets_eth0": "#7EB26D",
"receive_packets_lo": "#E24D42",
"transmit_packets_eth0": "#7EB26D",
"transmit_packets_lo": "#E24D42"
},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fill": 3,
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 15
},
"id": 312,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": false,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [
{
"alias": "Read",
"transform": "negative-Y"
}
],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(node_nfsd_disk_bytes_written_total{instance=~\"($node):$port\",job=~\"$job\"}[1m]))",
"format": "time_series",
"hide": false,
"intervalFactor": 1,
"legendFormat": "Write",
"refId": "A",
"step": 240
},
{
"expr": "sum(rate(node_nfsd_disk_bytes_read_total{instance=~\"($node):$port\",job=~\"$job\"}[1m]))",
"format": "time_series",
"hide": false,
"intervalFactor": 1,
"legendFormat": "Read",
"refId": "B"
}
],
"thresholds": [],
"timeFrom": null,
"timeShift": null,
"title": "NFS Kernel Server I/O",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "Bps",
"label": "",
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
}
],
"title": "NFS Kernel Server Metrics",
"type": "row"
}
],
"refresh": "5s",
"schemaVersion": 16,
"style": "dark",
"tags": [],
"templating": {
"list": [
{
"allValue": null,
"current": {},
"datasource": "Prometheus",
"hide": 0,
"includeAll": true,
"label": "Resource",
"multi": false,
"name": "job",
"options": [],
"query": "label_values(node_boot_time_seconds, job)",
"refresh": 2,
"regex": "",
"sort": 1,
"tagValuesQuery": "",
"tags": [],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": null,
"current": {},
"datasource": "Prometheus",
"hide": 0,
"includeAll": true,
"label": "Node",
"multi": false,
"name": "node",
"options": [],
"query": "label_values(node_boot_time_seconds{job=~\"$job\"}, instance)",
"refresh": 2,
"regex": "/([^:]+):.*/",
"sort": 1,
"tagValuesQuery": "",
"tags": [],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": null,
"current": {},
"datasource": "Prometheus",
"hide": 2,
"includeAll": false,
"label": "Port (NE)",
"multi": false,
"name": "port",
"options": [],
"query": "label_values(node_boot_time_seconds{instance=~\"$node:(.*)\"}, instance)",
"refresh": 2,
"regex": "/[^:]+:(.*)/",
"sort": 3,
"tagValuesQuery": "",
"tags": [],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": null,
"current": {},
"datasource": "Prometheus",
"hide": 2,
"includeAll": false,
"label": "Port (CA)",
"multi": false,
"name": "port_ca",
"options": [],
"query": "label_values(cadvisor_version_info{instance=~\"$node:(.*)\"}, instance)",
"refresh": 2,
"regex": "/[^:]+:(.*)/",
"sort": 0,
"tagValuesQuery": "",
"tags": [],
"tagsQuery": "",
"type": "query",
"useTags": false
}
]
},
"time": {
"from": "now-15m",
"to": "now"
},
"timepicker": {
"refresh_intervals": [
"5s",
"10s",
"30s",
"1m",
"5m",
"15m",
"30m",
"1h",
"2h",
"1d"
],
"time_options": [
"5m",
"15m",
"1h",
"6h",
"12h",
"24h",
"2d",
"7d",
"30d"
]
},
"timezone": "utc",
"title": "Batch Shipyard Dashboard",
"uid": "absdash",
"version": 1
}