5268 строки
138 KiB
JSON
5268 строки
138 KiB
JSON
{
|
|
"__requires": [
|
|
{
|
|
"type": "grafana",
|
|
"id": "grafana",
|
|
"name": "Grafana",
|
|
"version": "5.1.3"
|
|
},
|
|
{
|
|
"type": "panel",
|
|
"id": "graph",
|
|
"name": "Graph",
|
|
"version": "5.0.0"
|
|
},
|
|
{
|
|
"type": "datasource",
|
|
"id": "prometheus",
|
|
"name": "Prometheus",
|
|
"version": "5.0.0"
|
|
},
|
|
{
|
|
"type": "panel",
|
|
"id": "singlestat",
|
|
"name": "Singlestat",
|
|
"version": "5.0.0"
|
|
}
|
|
],
|
|
"annotations": {
|
|
"list": [
|
|
{
|
|
"builtIn": 1,
|
|
"datasource": "-- Grafana --",
|
|
"enable": true,
|
|
"hide": true,
|
|
"iconColor": "rgba(0, 211, 255, 1)",
|
|
"limit": 100,
|
|
"name": "Annotations & Alerts",
|
|
"showIn": 0,
|
|
"type": "dashboard"
|
|
}
|
|
]
|
|
},
|
|
"description": "Dashboard for Batch Shipyard resources",
|
|
"editable": true,
|
|
"gnetId": null,
|
|
"graphTooltip": 0,
|
|
"id": null,
|
|
"iteration": 1528233885724,
|
|
"links": [],
|
|
"panels": [
|
|
{
|
|
"collapsed": false,
|
|
"gridPos": {
|
|
"h": 1,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 0
|
|
},
|
|
"id": 286,
|
|
"panels": [],
|
|
"title": "Aggregate Overview for Resource",
|
|
"type": "row"
|
|
},
|
|
{
|
|
"cacheTimeout": null,
|
|
"colorBackground": false,
|
|
"colorValue": false,
|
|
"colors": [
|
|
"rgba(245, 54, 54, 0.9)",
|
|
"rgba(237, 129, 40, 0.89)",
|
|
"rgba(50, 172, 45, 0.97)"
|
|
],
|
|
"datasource": "Prometheus",
|
|
"description": "Total number of nodes",
|
|
"format": "short",
|
|
"gauge": {
|
|
"maxValue": 100,
|
|
"minValue": 0,
|
|
"show": false,
|
|
"thresholdLabels": false,
|
|
"thresholdMarkers": true
|
|
},
|
|
"gridPos": {
|
|
"h": 3,
|
|
"w": 2,
|
|
"x": 0,
|
|
"y": 1
|
|
},
|
|
"id": 289,
|
|
"interval": null,
|
|
"links": [],
|
|
"mappingType": 1,
|
|
"mappingTypes": [
|
|
{
|
|
"name": "value to text",
|
|
"value": 1
|
|
},
|
|
{
|
|
"name": "range to text",
|
|
"value": 2
|
|
}
|
|
],
|
|
"maxDataPoints": 100,
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"nullText": null,
|
|
"postfix": "",
|
|
"postfixFontSize": "50%",
|
|
"prefix": "",
|
|
"prefixFontSize": "50%",
|
|
"rangeMaps": [
|
|
{
|
|
"from": "null",
|
|
"text": "N/A",
|
|
"to": "null"
|
|
}
|
|
],
|
|
"sparkline": {
|
|
"fillColor": "rgba(31, 118, 189, 0.18)",
|
|
"full": false,
|
|
"lineColor": "rgb(31, 120, 193)",
|
|
"show": false
|
|
},
|
|
"tableColumn": "",
|
|
"targets": [
|
|
{
|
|
"expr": "count(count(node_cpu_seconds_total{job=~\"$job\"}) without (cpu, mode))",
|
|
"format": "time_series",
|
|
"intervalFactor": 1,
|
|
"refId": "B"
|
|
}
|
|
],
|
|
"thresholds": "",
|
|
"title": "Nodes",
|
|
"type": "singlestat",
|
|
"valueFontSize": "50%",
|
|
"valueMaps": [
|
|
{
|
|
"op": "=",
|
|
"text": "N/A",
|
|
"value": "null"
|
|
}
|
|
],
|
|
"valueName": "current"
|
|
},
|
|
{
|
|
"cacheTimeout": null,
|
|
"colorBackground": false,
|
|
"colorValue": false,
|
|
"colors": [
|
|
"rgba(245, 54, 54, 0.9)",
|
|
"rgba(237, 129, 40, 0.89)",
|
|
"rgba(50, 172, 45, 0.97)"
|
|
],
|
|
"datasource": "Prometheus",
|
|
"decimals": 1,
|
|
"description": "System uptime",
|
|
"format": "s",
|
|
"gauge": {
|
|
"maxValue": 100,
|
|
"minValue": 0,
|
|
"show": false,
|
|
"thresholdLabels": false,
|
|
"thresholdMarkers": true
|
|
},
|
|
"gridPos": {
|
|
"h": 2,
|
|
"w": 4,
|
|
"x": 2,
|
|
"y": 1
|
|
},
|
|
"hideTimeOverride": true,
|
|
"id": 290,
|
|
"interval": null,
|
|
"links": [],
|
|
"mappingType": 1,
|
|
"mappingTypes": [
|
|
{
|
|
"name": "value to text",
|
|
"value": 1
|
|
},
|
|
{
|
|
"name": "range to text",
|
|
"value": 2
|
|
}
|
|
],
|
|
"maxDataPoints": 100,
|
|
"nullPointMode": "null",
|
|
"nullText": null,
|
|
"postfix": "s",
|
|
"postfixFontSize": "50%",
|
|
"prefix": "",
|
|
"prefixFontSize": "50%",
|
|
"rangeMaps": [
|
|
{
|
|
"from": "null",
|
|
"text": "N/A",
|
|
"to": "null"
|
|
}
|
|
],
|
|
"sparkline": {
|
|
"fillColor": "rgba(31, 118, 189, 0.18)",
|
|
"full": false,
|
|
"lineColor": "rgb(31, 120, 193)",
|
|
"show": false
|
|
},
|
|
"tableColumn": "",
|
|
"targets": [
|
|
{
|
|
"expr": "avg(node_time_seconds{job=~\"$job\"}) - avg(node_boot_time_seconds{job=~\"$job\"})",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"refId": "A",
|
|
"step": 1800
|
|
}
|
|
],
|
|
"thresholds": "",
|
|
"title": "Average Uptime",
|
|
"transparent": false,
|
|
"type": "singlestat",
|
|
"valueFontSize": "50%",
|
|
"valueMaps": [
|
|
{
|
|
"op": "=",
|
|
"text": "N/A",
|
|
"value": "null"
|
|
}
|
|
],
|
|
"valueName": "current"
|
|
},
|
|
{
|
|
"cacheTimeout": null,
|
|
"colorBackground": false,
|
|
"colorValue": false,
|
|
"colors": [
|
|
"rgba(245, 54, 54, 0.9)",
|
|
"rgba(237, 129, 40, 0.89)",
|
|
"rgba(50, 172, 45, 0.97)"
|
|
],
|
|
"datasource": "Prometheus",
|
|
"decimals": 2,
|
|
"description": "Total Memory",
|
|
"format": "bytes",
|
|
"gauge": {
|
|
"maxValue": 100,
|
|
"minValue": 0,
|
|
"show": false,
|
|
"thresholdLabels": false,
|
|
"thresholdMarkers": true
|
|
},
|
|
"gridPos": {
|
|
"h": 2,
|
|
"w": 4,
|
|
"x": 6,
|
|
"y": 1
|
|
},
|
|
"id": 288,
|
|
"interval": null,
|
|
"links": [],
|
|
"mappingType": 1,
|
|
"mappingTypes": [
|
|
{
|
|
"name": "value to text",
|
|
"value": 1
|
|
},
|
|
{
|
|
"name": "range to text",
|
|
"value": 2
|
|
}
|
|
],
|
|
"maxDataPoints": 100,
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"nullText": null,
|
|
"postfix": "",
|
|
"postfixFontSize": "70%",
|
|
"prefix": "",
|
|
"prefixFontSize": "50%",
|
|
"rangeMaps": [
|
|
{
|
|
"from": "null",
|
|
"text": "N/A",
|
|
"to": "null"
|
|
}
|
|
],
|
|
"sparkline": {
|
|
"fillColor": "rgba(31, 118, 189, 0.18)",
|
|
"full": false,
|
|
"lineColor": "rgb(31, 120, 193)",
|
|
"show": false
|
|
},
|
|
"tableColumn": "",
|
|
"targets": [
|
|
{
|
|
"expr": "sum(node_memory_MemTotal_bytes{job=~\"$job\"})",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 1,
|
|
"refId": "A",
|
|
"step": 900
|
|
}
|
|
],
|
|
"thresholds": "",
|
|
"title": "Total Memory",
|
|
"type": "singlestat",
|
|
"valueFontSize": "50%",
|
|
"valueMaps": [
|
|
{
|
|
"op": "=",
|
|
"text": "N/A",
|
|
"value": "null"
|
|
}
|
|
],
|
|
"valueName": "current"
|
|
},
|
|
{
|
|
"aliasColors": {
|
|
"Recv_bytes_eth2": "#7EB26D",
|
|
"Recv_bytes_lo": "#0A50A1",
|
|
"Recv_drop_eth2": "#6ED0E0",
|
|
"Recv_drop_lo": "#E0F9D7",
|
|
"Recv_errs_eth2": "#BF1B00",
|
|
"Recv_errs_lo": "#CCA300",
|
|
"Trans_bytes_eth2": "#7EB26D",
|
|
"Trans_bytes_lo": "#0A50A1",
|
|
"Trans_drop_eth2": "#6ED0E0",
|
|
"Trans_drop_lo": "#E0F9D7",
|
|
"Trans_errs_eth2": "#BF1B00",
|
|
"Trans_errs_lo": "#CCA300",
|
|
"recv_bytes_lo": "#0A50A1",
|
|
"recv_drop_eth0": "#99440A",
|
|
"recv_drop_lo": "#967302",
|
|
"recv_errs_eth0": "#BF1B00",
|
|
"recv_errs_lo": "#890F02",
|
|
"trans_bytes_eth0": "#7EB26D",
|
|
"trans_bytes_lo": "#0A50A1",
|
|
"trans_drop_eth0": "#99440A",
|
|
"trans_drop_lo": "#967302",
|
|
"trans_errs_eth0": "#BF1B00",
|
|
"trans_errs_lo": "#890F02"
|
|
},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"description": "Aggregate Network traffic on all devices",
|
|
"fill": 4,
|
|
"gridPos": {
|
|
"h": 6,
|
|
"w": 6,
|
|
"x": 10,
|
|
"y": 1
|
|
},
|
|
"id": 300,
|
|
"legend": {
|
|
"alignAsTable": false,
|
|
"avg": false,
|
|
"current": false,
|
|
"hideEmpty": false,
|
|
"hideZero": false,
|
|
"max": false,
|
|
"min": false,
|
|
"rightSide": false,
|
|
"show": false,
|
|
"sort": "current",
|
|
"sortDesc": true,
|
|
"total": false,
|
|
"values": false
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "/.*trans.*/",
|
|
"transform": "negative-Y"
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "sum(rate(node_network_receive_bytes_total{job=~\"$job\"}[1m]))",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "receive",
|
|
"refId": "A",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "sum(rate(node_network_transmit_bytes_total{job=~\"$job\"}[1m]))",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "transmit",
|
|
"refId": "B",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Network Traffic",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"transparent": false,
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "bytes",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "pps",
|
|
"label": "",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"cacheTimeout": null,
|
|
"colorBackground": false,
|
|
"colorValue": false,
|
|
"colors": [
|
|
"rgba(50, 172, 45, 0.97)",
|
|
"rgba(237, 129, 40, 0.89)",
|
|
"rgba(245, 54, 54, 0.9)"
|
|
],
|
|
"datasource": "Prometheus",
|
|
"decimals": null,
|
|
"description": "Smallest free ephemeral disk space on a node",
|
|
"format": "bytes",
|
|
"gauge": {
|
|
"maxValue": 100,
|
|
"minValue": 0,
|
|
"show": false,
|
|
"thresholdLabels": false,
|
|
"thresholdMarkers": true
|
|
},
|
|
"gridPos": {
|
|
"h": 2,
|
|
"w": 4,
|
|
"x": 16,
|
|
"y": 1
|
|
},
|
|
"id": 293,
|
|
"interval": null,
|
|
"links": [],
|
|
"mappingType": 1,
|
|
"mappingTypes": [
|
|
{
|
|
"name": "value to text",
|
|
"value": 1
|
|
},
|
|
{
|
|
"name": "range to text",
|
|
"value": 2
|
|
}
|
|
],
|
|
"maxDataPoints": 100,
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"nullText": null,
|
|
"postfix": "",
|
|
"postfixFontSize": "50%",
|
|
"prefix": "",
|
|
"prefixFontSize": "50%",
|
|
"rangeMaps": [
|
|
{
|
|
"from": "null",
|
|
"text": "N/A",
|
|
"to": "null"
|
|
}
|
|
],
|
|
"sparkline": {
|
|
"fillColor": "rgba(31, 118, 189, 0.18)",
|
|
"full": false,
|
|
"lineColor": "rgb(31, 120, 193)",
|
|
"show": false
|
|
},
|
|
"tableColumn": "",
|
|
"targets": [
|
|
{
|
|
"expr": "min(node_filesystem_avail_bytes{device=\"/dev/sdb1\",job=~\"$job\"})",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 1,
|
|
"refId": "A",
|
|
"step": 900
|
|
}
|
|
],
|
|
"thresholds": "70,90",
|
|
"title": "Min Free Ephemeral FS Space",
|
|
"type": "singlestat",
|
|
"valueFontSize": "50%",
|
|
"valueMaps": [
|
|
{
|
|
"op": "=",
|
|
"text": "N/A",
|
|
"value": "null"
|
|
}
|
|
],
|
|
"valueName": "current"
|
|
},
|
|
{
|
|
"cacheTimeout": null,
|
|
"colorBackground": false,
|
|
"colorValue": false,
|
|
"colors": [
|
|
"rgba(50, 172, 45, 0.97)",
|
|
"rgba(237, 129, 40, 0.89)",
|
|
"rgba(245, 54, 54, 0.9)"
|
|
],
|
|
"datasource": "Prometheus",
|
|
"decimals": null,
|
|
"description": "Smallest free root disk space on a node",
|
|
"format": "bytes",
|
|
"gauge": {
|
|
"maxValue": 100,
|
|
"minValue": 0,
|
|
"show": false,
|
|
"thresholdLabels": false,
|
|
"thresholdMarkers": true
|
|
},
|
|
"gridPos": {
|
|
"h": 2,
|
|
"w": 4,
|
|
"x": 20,
|
|
"y": 1
|
|
},
|
|
"id": 294,
|
|
"interval": null,
|
|
"links": [],
|
|
"mappingType": 1,
|
|
"mappingTypes": [
|
|
{
|
|
"name": "value to text",
|
|
"value": 1
|
|
},
|
|
{
|
|
"name": "range to text",
|
|
"value": 2
|
|
}
|
|
],
|
|
"maxDataPoints": 100,
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"nullText": null,
|
|
"postfix": "",
|
|
"postfixFontSize": "50%",
|
|
"prefix": "",
|
|
"prefixFontSize": "50%",
|
|
"rangeMaps": [
|
|
{
|
|
"from": "null",
|
|
"text": "N/A",
|
|
"to": "null"
|
|
}
|
|
],
|
|
"sparkline": {
|
|
"fillColor": "rgba(31, 118, 189, 0.18)",
|
|
"full": false,
|
|
"lineColor": "rgb(31, 120, 193)",
|
|
"show": false
|
|
},
|
|
"tableColumn": "",
|
|
"targets": [
|
|
{
|
|
"expr": "min(node_filesystem_avail_bytes{mountpoint=\"/\",job=~\"$job\"})",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 1,
|
|
"refId": "A",
|
|
"step": 900
|
|
}
|
|
],
|
|
"thresholds": "70,90",
|
|
"title": "Min Free Root FS Space",
|
|
"type": "singlestat",
|
|
"valueFontSize": "50%",
|
|
"valueMaps": [
|
|
{
|
|
"op": "=",
|
|
"text": "N/A",
|
|
"value": "null"
|
|
}
|
|
],
|
|
"valueName": "current"
|
|
},
|
|
{
|
|
"cacheTimeout": null,
|
|
"colorBackground": false,
|
|
"colorValue": true,
|
|
"colors": [
|
|
"rgba(50, 172, 45, 0.97)",
|
|
"rgba(237, 129, 40, 0.89)",
|
|
"rgba(245, 54, 54, 0.9)"
|
|
],
|
|
"datasource": "Prometheus",
|
|
"decimals": null,
|
|
"description": "Core usage across all nodes",
|
|
"format": "percent",
|
|
"gauge": {
|
|
"maxValue": 100,
|
|
"minValue": 0,
|
|
"show": true,
|
|
"thresholdLabels": false,
|
|
"thresholdMarkers": true
|
|
},
|
|
"gridPos": {
|
|
"h": 4,
|
|
"w": 4,
|
|
"x": 2,
|
|
"y": 3
|
|
},
|
|
"id": 282,
|
|
"interval": null,
|
|
"links": [],
|
|
"mappingType": 1,
|
|
"mappingTypes": [
|
|
{
|
|
"name": "value to text",
|
|
"value": 1
|
|
},
|
|
{
|
|
"name": "range to text",
|
|
"value": 2
|
|
}
|
|
],
|
|
"maxDataPoints": 100,
|
|
"minSpan": 2,
|
|
"nullPointMode": "null",
|
|
"nullText": null,
|
|
"postfix": "",
|
|
"postfixFontSize": "50%",
|
|
"prefix": "",
|
|
"prefixFontSize": "50%",
|
|
"rangeMaps": [
|
|
{
|
|
"from": "null",
|
|
"text": "N/A",
|
|
"to": "null"
|
|
}
|
|
],
|
|
"sparkline": {
|
|
"fillColor": "rgba(31, 118, 189, 0.18)",
|
|
"full": false,
|
|
"lineColor": "rgb(31, 120, 193)",
|
|
"show": true
|
|
},
|
|
"tableColumn": "",
|
|
"targets": [
|
|
{
|
|
"expr": "100 * (1 - avg(irate(node_cpu_seconds_total{mode=\"idle\",job=~\"$job\"}[1m])))",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 1,
|
|
"legendFormat": "",
|
|
"refId": "A",
|
|
"step": 900
|
|
}
|
|
],
|
|
"thresholds": "85,95",
|
|
"title": "CPU Usage",
|
|
"type": "singlestat",
|
|
"valueFontSize": "80%",
|
|
"valueMaps": [
|
|
{
|
|
"op": "=",
|
|
"text": "N/A",
|
|
"value": "null"
|
|
}
|
|
],
|
|
"valueName": "current"
|
|
},
|
|
{
|
|
"cacheTimeout": null,
|
|
"colorBackground": false,
|
|
"colorValue": true,
|
|
"colors": [
|
|
"rgba(50, 172, 45, 0.97)",
|
|
"rgba(237, 129, 40, 0.89)",
|
|
"rgba(245, 54, 54, 0.9)"
|
|
],
|
|
"datasource": "Prometheus",
|
|
"decimals": 0,
|
|
"description": "Memory Used by all nodes",
|
|
"format": "percent",
|
|
"gauge": {
|
|
"maxValue": 100,
|
|
"minValue": 0,
|
|
"show": true,
|
|
"thresholdLabels": false,
|
|
"thresholdMarkers": true
|
|
},
|
|
"gridPos": {
|
|
"h": 4,
|
|
"w": 4,
|
|
"x": 6,
|
|
"y": 3
|
|
},
|
|
"hideTimeOverride": false,
|
|
"id": 16,
|
|
"interval": null,
|
|
"links": [],
|
|
"mappingType": 1,
|
|
"mappingTypes": [
|
|
{
|
|
"name": "value to text",
|
|
"value": 1
|
|
},
|
|
{
|
|
"name": "range to text",
|
|
"value": 2
|
|
}
|
|
],
|
|
"maxDataPoints": 100,
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"nullText": null,
|
|
"postfix": "",
|
|
"postfixFontSize": "50%",
|
|
"prefix": "",
|
|
"prefixFontSize": "50%",
|
|
"rangeMaps": [
|
|
{
|
|
"from": "null",
|
|
"text": "N/A",
|
|
"to": "null"
|
|
}
|
|
],
|
|
"sparkline": {
|
|
"fillColor": "rgba(31, 118, 189, 0.18)",
|
|
"full": false,
|
|
"lineColor": "rgb(31, 120, 193)",
|
|
"show": true
|
|
},
|
|
"tableColumn": "",
|
|
"targets": [
|
|
{
|
|
"expr": "100 * (sum(node_memory_MemTotal_bytes{job=~\"$job\"}) - sum(node_memory_MemAvailable_bytes{job=~\"$job\"})) / sum(node_memory_MemTotal_bytes{job=~\"$job\"})",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 1,
|
|
"refId": "B",
|
|
"step": 900
|
|
}
|
|
],
|
|
"thresholds": "80,90",
|
|
"title": "Memory Usage",
|
|
"type": "singlestat",
|
|
"valueFontSize": "80%",
|
|
"valueMaps": [],
|
|
"valueName": "current"
|
|
},
|
|
{
|
|
"cacheTimeout": null,
|
|
"colorBackground": false,
|
|
"colorValue": true,
|
|
"colors": [
|
|
"rgba(50, 172, 45, 0.97)",
|
|
"rgba(237, 129, 40, 0.89)",
|
|
"rgba(245, 54, 54, 0.9)"
|
|
],
|
|
"datasource": "Prometheus",
|
|
"decimals": null,
|
|
"description": "Average used ephemeral FS",
|
|
"format": "percent",
|
|
"gauge": {
|
|
"maxValue": 100,
|
|
"minValue": 0,
|
|
"show": true,
|
|
"thresholdLabels": false,
|
|
"thresholdMarkers": true
|
|
},
|
|
"gridPos": {
|
|
"h": 4,
|
|
"w": 4,
|
|
"x": 16,
|
|
"y": 3
|
|
},
|
|
"id": 291,
|
|
"interval": null,
|
|
"links": [],
|
|
"mappingType": 1,
|
|
"mappingTypes": [
|
|
{
|
|
"name": "value to text",
|
|
"value": 1
|
|
},
|
|
{
|
|
"name": "range to text",
|
|
"value": 2
|
|
}
|
|
],
|
|
"maxDataPoints": 100,
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"nullText": null,
|
|
"postfix": "",
|
|
"postfixFontSize": "50%",
|
|
"prefix": "",
|
|
"prefixFontSize": "50%",
|
|
"rangeMaps": [
|
|
{
|
|
"from": "null",
|
|
"text": "N/A",
|
|
"to": "null"
|
|
}
|
|
],
|
|
"sparkline": {
|
|
"fillColor": "rgba(31, 118, 189, 0.18)",
|
|
"full": false,
|
|
"lineColor": "rgb(31, 120, 193)",
|
|
"show": true
|
|
},
|
|
"tableColumn": "",
|
|
"targets": [
|
|
{
|
|
"expr": "100 * ((sum(node_filesystem_size_bytes{device=\"/dev/sdb1\",job=~\"$job\"}) - sum(node_filesystem_avail_bytes{device=\"/dev/sdb1\",job=~\"$job\"})) / sum(node_filesystem_size_bytes{device=\"/dev/sdb1\",job=~\"$job\"}))",
|
|
"format": "time_series",
|
|
"intervalFactor": 1,
|
|
"refId": "A",
|
|
"step": 900
|
|
}
|
|
],
|
|
"thresholds": "80,90",
|
|
"title": "Ephemeral FS Usage",
|
|
"type": "singlestat",
|
|
"valueFontSize": "80%",
|
|
"valueMaps": [
|
|
{
|
|
"op": "=",
|
|
"text": "N/A",
|
|
"value": "null"
|
|
}
|
|
],
|
|
"valueName": "current"
|
|
},
|
|
{
|
|
"cacheTimeout": null,
|
|
"colorBackground": false,
|
|
"colorValue": true,
|
|
"colors": [
|
|
"rgba(50, 172, 45, 0.97)",
|
|
"rgba(237, 129, 40, 0.89)",
|
|
"rgba(245, 54, 54, 0.9)"
|
|
],
|
|
"datasource": "Prometheus",
|
|
"decimals": null,
|
|
"description": "Average Used Root FS",
|
|
"format": "percent",
|
|
"gauge": {
|
|
"maxValue": 100,
|
|
"minValue": 0,
|
|
"show": true,
|
|
"thresholdLabels": false,
|
|
"thresholdMarkers": true
|
|
},
|
|
"gridPos": {
|
|
"h": 4,
|
|
"w": 4,
|
|
"x": 20,
|
|
"y": 3
|
|
},
|
|
"id": 292,
|
|
"interval": null,
|
|
"links": [],
|
|
"mappingType": 1,
|
|
"mappingTypes": [
|
|
{
|
|
"name": "value to text",
|
|
"value": 1
|
|
},
|
|
{
|
|
"name": "range to text",
|
|
"value": 2
|
|
}
|
|
],
|
|
"maxDataPoints": 100,
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"nullText": null,
|
|
"postfix": "",
|
|
"postfixFontSize": "50%",
|
|
"prefix": "",
|
|
"prefixFontSize": "50%",
|
|
"rangeMaps": [
|
|
{
|
|
"from": "null",
|
|
"text": "N/A",
|
|
"to": "null"
|
|
}
|
|
],
|
|
"sparkline": {
|
|
"fillColor": "rgba(31, 118, 189, 0.18)",
|
|
"full": false,
|
|
"lineColor": "rgb(31, 120, 193)",
|
|
"show": true
|
|
},
|
|
"tableColumn": "",
|
|
"targets": [
|
|
{
|
|
"expr": "100 * ((sum(node_filesystem_size_bytes{mountpoint=\"/\",job=~\"$job\"}) - sum(node_filesystem_avail_bytes{mountpoint=\"/\",job=~\"$job\"})) / sum(node_filesystem_size_bytes{mountpoint=\"/\",job=~\"$job\"}))",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 1,
|
|
"refId": "A",
|
|
"step": 900
|
|
}
|
|
],
|
|
"thresholds": "80,90",
|
|
"title": "Root FS Usage",
|
|
"type": "singlestat",
|
|
"valueFontSize": "80%",
|
|
"valueMaps": [
|
|
{
|
|
"op": "=",
|
|
"text": "N/A",
|
|
"value": "null"
|
|
}
|
|
],
|
|
"valueName": "current"
|
|
},
|
|
{
|
|
"cacheTimeout": null,
|
|
"colorBackground": false,
|
|
"colorValue": false,
|
|
"colors": [
|
|
"rgba(245, 54, 54, 0.9)",
|
|
"rgba(237, 129, 40, 0.89)",
|
|
"rgba(50, 172, 45, 0.97)"
|
|
],
|
|
"datasource": "Prometheus",
|
|
"description": "Total number of CPU cores",
|
|
"format": "short",
|
|
"gauge": {
|
|
"maxValue": 100,
|
|
"minValue": 0,
|
|
"show": false,
|
|
"thresholdLabels": false,
|
|
"thresholdMarkers": true
|
|
},
|
|
"gridPos": {
|
|
"h": 3,
|
|
"w": 2,
|
|
"x": 0,
|
|
"y": 4
|
|
},
|
|
"id": 287,
|
|
"interval": null,
|
|
"links": [],
|
|
"mappingType": 1,
|
|
"mappingTypes": [
|
|
{
|
|
"name": "value to text",
|
|
"value": 1
|
|
},
|
|
{
|
|
"name": "range to text",
|
|
"value": 2
|
|
}
|
|
],
|
|
"maxDataPoints": 100,
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"nullText": null,
|
|
"postfix": "",
|
|
"postfixFontSize": "50%",
|
|
"prefix": "",
|
|
"prefixFontSize": "50%",
|
|
"rangeMaps": [
|
|
{
|
|
"from": "null",
|
|
"text": "N/A",
|
|
"to": "null"
|
|
}
|
|
],
|
|
"sparkline": {
|
|
"fillColor": "rgba(31, 118, 189, 0.18)",
|
|
"full": false,
|
|
"lineColor": "rgb(31, 120, 193)",
|
|
"show": false
|
|
},
|
|
"tableColumn": "",
|
|
"targets": [
|
|
{
|
|
"expr": "count(count(node_cpu_seconds_total{job=~\"$job\"}) without (mode))",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 1,
|
|
"refId": "A",
|
|
"step": 900
|
|
}
|
|
],
|
|
"thresholds": "",
|
|
"title": "Total Cores",
|
|
"type": "singlestat",
|
|
"valueFontSize": "50%",
|
|
"valueMaps": [
|
|
{
|
|
"op": "=",
|
|
"text": "N/A",
|
|
"value": "null"
|
|
}
|
|
],
|
|
"valueName": "current"
|
|
},
|
|
{
|
|
"collapsed": true,
|
|
"gridPos": {
|
|
"h": 1,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 7
|
|
},
|
|
"id": 298,
|
|
"panels": [
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"decimals": 2,
|
|
"description": "Core usage for containers",
|
|
"editable": true,
|
|
"error": false,
|
|
"fill": 0,
|
|
"grid": {},
|
|
"gridPos": {
|
|
"h": 13,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 32
|
|
},
|
|
"height": "",
|
|
"id": 302,
|
|
"isNew": true,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"hideEmpty": false,
|
|
"hideZero": false,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": null,
|
|
"sort": "current",
|
|
"sortDesc": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 2,
|
|
"links": [],
|
|
"nullPointMode": "connected",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "sum(rate(container_cpu_usage_seconds_total{image!=\"\",instance=~\"($node):$port_ca\",job=~\"$job\"}[1m])) by (name, image, job, instance)",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"interval": "10s",
|
|
"intervalFactor": 1,
|
|
"legendFormat": "{{name}}: {{image}} ({{job}}: {{instance}})",
|
|
"metric": "container_cpu",
|
|
"refId": "A",
|
|
"step": 10
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Container Core Usage (1m avg)",
|
|
"tooltip": {
|
|
"msResolution": true,
|
|
"shared": true,
|
|
"sort": 2,
|
|
"value_type": "cumulative"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "none",
|
|
"label": "cores",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"decimals": 2,
|
|
"description": "Container Memory Usage (Working Set Size)",
|
|
"editable": true,
|
|
"error": false,
|
|
"fill": 0,
|
|
"grid": {},
|
|
"gridPos": {
|
|
"h": 13,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 32
|
|
},
|
|
"height": "200px",
|
|
"id": 303,
|
|
"isNew": true,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 200,
|
|
"sort": null,
|
|
"sortDesc": null,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 2,
|
|
"links": [],
|
|
"nullPointMode": "connected",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "sum(container_memory_working_set_bytes{image!=\"\",instance=~\"($node):$port_ca\",job=~\"$job\"}) by (name, image, job, instance)",
|
|
"format": "time_series",
|
|
"interval": "10s",
|
|
"intervalFactor": 1,
|
|
"legendFormat": "{{name}}: {{image}} ({{job}}: {{instance}})",
|
|
"refId": "C"
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Container Memory Usage (Working Set)",
|
|
"tooltip": {
|
|
"msResolution": false,
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "cumulative"
|
|
},
|
|
"transparent": false,
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "decbytes",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "Bps",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"decimals": 2,
|
|
"description": "Container Network I/O",
|
|
"editable": true,
|
|
"error": false,
|
|
"fill": 0,
|
|
"grid": {},
|
|
"gridPos": {
|
|
"h": 13,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 45
|
|
},
|
|
"height": "200px",
|
|
"id": 296,
|
|
"isNew": true,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 200,
|
|
"sort": null,
|
|
"sortDesc": null,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 2,
|
|
"links": [],
|
|
"nullPointMode": "connected",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "sum(rate(container_network_receive_bytes_total{image!=\"\",instance=~\"($node):$port_ca\",job=~\"$job\"}[1m])) by (name, image, job, instance)",
|
|
"format": "time_series",
|
|
"intervalFactor": 1,
|
|
"legendFormat": "{{name}}: {{image}} ({{job}}: {{instance}})",
|
|
"refId": "C"
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Container Network I/O (1m avg)",
|
|
"tooltip": {
|
|
"msResolution": false,
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "cumulative"
|
|
},
|
|
"transparent": false,
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "Bps",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "Bps",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"decimals": 2,
|
|
"description": "Container Disk Usage",
|
|
"editable": true,
|
|
"error": false,
|
|
"fill": 0,
|
|
"grid": {},
|
|
"gridPos": {
|
|
"h": 13,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 45
|
|
},
|
|
"height": "200px",
|
|
"id": 304,
|
|
"isNew": true,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": false,
|
|
"min": false,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 200,
|
|
"sort": null,
|
|
"sortDesc": null,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 2,
|
|
"links": [],
|
|
"nullPointMode": "connected",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "sum(container_fs_usage_bytes{image!=\"\",instance=~\"($node):$port_ca\",job=~\"$job\"}) by (name, image, job, instance)",
|
|
"format": "time_series",
|
|
"interval": "10s",
|
|
"intervalFactor": 1,
|
|
"legendFormat": "{{name}}: {{image}} ({{job}}: {{instance}})",
|
|
"refId": "C"
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Container Disk Usage",
|
|
"tooltip": {
|
|
"msResolution": false,
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "cumulative"
|
|
},
|
|
"transparent": false,
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "decbytes",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "Bps",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"decimals": 2,
|
|
"description": "Container Write Usage",
|
|
"editable": true,
|
|
"error": false,
|
|
"fill": 0,
|
|
"grid": {},
|
|
"gridPos": {
|
|
"h": 12,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 58
|
|
},
|
|
"height": "200px",
|
|
"id": 305,
|
|
"isNew": true,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": false,
|
|
"min": false,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 200,
|
|
"sort": null,
|
|
"sortDesc": null,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 2,
|
|
"links": [],
|
|
"nullPointMode": "connected",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "sum(container_fs_writes_bytes_total{image!=\"\",instance=~\"($node):$port_ca\",job=~\"$job\"}) by (name, image, job, instance)",
|
|
"format": "time_series",
|
|
"interval": "10s",
|
|
"intervalFactor": 1,
|
|
"legendFormat": "{{name}}: {{image}} ({{job}}: {{instance}})",
|
|
"refId": "C"
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Container Aggregate Write (total bytes)",
|
|
"tooltip": {
|
|
"msResolution": false,
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "cumulative"
|
|
},
|
|
"transparent": false,
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "decbytes",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"decimals": null,
|
|
"format": "none",
|
|
"label": "",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"decimals": 2,
|
|
"description": "Container Read Usage",
|
|
"editable": true,
|
|
"error": false,
|
|
"fill": 0,
|
|
"grid": {},
|
|
"gridPos": {
|
|
"h": 12,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 58
|
|
},
|
|
"height": "200px",
|
|
"id": 306,
|
|
"isNew": true,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": false,
|
|
"min": false,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 200,
|
|
"sort": null,
|
|
"sortDesc": null,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 2,
|
|
"links": [],
|
|
"nullPointMode": "connected",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "sum(container_fs_reads_bytes_total{image!=\"\",instance=~\"($node):$port_ca\",job=~\"$job\"}) by (name, image, job, instance)",
|
|
"format": "time_series",
|
|
"interval": "10s",
|
|
"intervalFactor": 1,
|
|
"legendFormat": "{{name}}: {{image}} ({{job}}: {{instance}})",
|
|
"refId": "C"
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Container Aggregate Read (1m avg)",
|
|
"tooltip": {
|
|
"msResolution": false,
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "cumulative"
|
|
},
|
|
"transparent": false,
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "decbytes",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"decimals": null,
|
|
"format": "none",
|
|
"label": "",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
}
|
|
],
|
|
"title": "Container Metrics",
|
|
"type": "row"
|
|
},
|
|
{
|
|
"collapsed": true,
|
|
"gridPos": {
|
|
"h": 1,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 8
|
|
},
|
|
"id": 263,
|
|
"panels": [
|
|
{
|
|
"aliasColors": {
|
|
"Idle - Waiting for something to happen": "#052B51",
|
|
"guest": "#9AC48A",
|
|
"idle": "#052B51",
|
|
"iowait": "#EAB839",
|
|
"irq": "#BF1B00",
|
|
"nice": "#C15C17",
|
|
"softirq": "#E24D42",
|
|
"steal": "#FCE2DE",
|
|
"system": "#508642",
|
|
"user": "#5195CE"
|
|
},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"decimals": 2,
|
|
"description": "",
|
|
"fill": 4,
|
|
"gridPos": {
|
|
"h": 12,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 9
|
|
},
|
|
"id": 3,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 250,
|
|
"sort": null,
|
|
"sortDesc": null,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"percentage": true,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"repeat": null,
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": true,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode=\"system\",instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
|
|
"format": "time_series",
|
|
"interval": "10s",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "System - Processes executing in kernel mode",
|
|
"refId": "A",
|
|
"step": 20
|
|
},
|
|
{
|
|
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='user',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "User - Normal processes executing in user mode",
|
|
"refId": "B",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='nice',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Nice - Niced processes executing in user mode",
|
|
"refId": "C",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='idle',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Idle - Waiting for something to happen",
|
|
"refId": "F",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='iowait',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Iowait - Waiting for I/O to complete",
|
|
"refId": "D",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='irq',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Irq - Servicing interrupts",
|
|
"refId": "G",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='softirq',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Softirq - Servicing softirqs",
|
|
"refId": "H",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='steal',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Steal - Time spent in other operating systems when running in a virtualized environment",
|
|
"refId": "E",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "sum by (mode)(irate(node_cpu_seconds_total{mode='guest',instance=~\"($node):$port\",job=~\"$job\"}[5m])) * 100",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Guest - Time spent running a virtual CPU for a guest operating system",
|
|
"refId": "I",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "CPU",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"transparent": false,
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Percentage",
|
|
"logBase": 1,
|
|
"max": "100",
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {
|
|
"Apps": "#629E51",
|
|
"Buffers": "#614D93",
|
|
"Cache": "#6D1F62",
|
|
"Cached": "#511749",
|
|
"Committed": "#508642",
|
|
"Free": "#0A437C",
|
|
"Harware Corrupted - Amount of RAM that the kernel identified as corrupted / not working": "#CFFAFF",
|
|
"Inactive": "#584477",
|
|
"PageTables": "#0A50A1",
|
|
"Page_Tables": "#0A50A1",
|
|
"RAM_Free": "#E0F9D7",
|
|
"Slab": "#806EB7",
|
|
"Slab_Cache": "#E0752D",
|
|
"Swap": "#BF1B00",
|
|
"Swap - Swap space used": "#BF1B00",
|
|
"Swap_Cache": "#C15C17",
|
|
"Swap_Free": "#2F575E",
|
|
"Unused": "#EAB839",
|
|
"Unused - Free memory unasigned": "#052B51"
|
|
},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"decimals": 2,
|
|
"description": "",
|
|
"fill": 4,
|
|
"gridPos": {
|
|
"h": 12,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 9
|
|
},
|
|
"id": 24,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 350,
|
|
"sort": null,
|
|
"sortDesc": null,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "/.*Harware Corrupted - .*/",
|
|
"stack": false
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": true,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_memory_MemTotal_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_MemFree_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_Buffers_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_Cached_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_Slab_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_PageTables_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_SwapCached_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Apps - Memory used by user-space applications",
|
|
"refId": "Q",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_memory_PageTables_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "PageTables - Memory used to map between virtual and physical memory addresses",
|
|
"refId": "G",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_memory_SwapCached_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "SwapCache - Memory that keeps track of pages that have been fetched from swap but not yet been modified",
|
|
"refId": "F",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_memory_Slab_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Slab - Memory used by the kernel to cache data structures for its own use (caches like inode, dentry, etc)",
|
|
"refId": "E",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_memory_Cached_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Cache - Parked file data (file content) cache",
|
|
"refId": "C",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_memory_Buffers_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Buffers - Block device (e.g. harddisk) cache",
|
|
"refId": "B",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_memory_MemFree_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Unused - Free memory unasigned",
|
|
"refId": "D",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "(node_memory_SwapTotal_bytes{instance=~\"($node):$port\",job=~\"$job\"} - node_memory_SwapFree_bytes{instance=~\"($node):$port\",job=~\"$job\"})",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Swap - Swap space used",
|
|
"refId": "I",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_memory_HardwareCorrupted_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Harware Corrupted - Amount of RAM that the kernel identified as corrupted / not working",
|
|
"refId": "O",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Memory Stack",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "bytes",
|
|
"label": "Bytes",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {
|
|
"receive_packets_eth0": "#7EB26D",
|
|
"receive_packets_lo": "#E24D42",
|
|
"transmit_packets_eth0": "#7EB26D",
|
|
"transmit_packets_lo": "#E24D42"
|
|
},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 4,
|
|
"gridPos": {
|
|
"h": 12,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 21
|
|
},
|
|
"id": 84,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "/.*Trans.*/",
|
|
"transform": "negative-Y"
|
|
},
|
|
{
|
|
"alias": "/.*lo.*/",
|
|
"color": "#7EB26D"
|
|
},
|
|
{
|
|
"alias": "/.*eth0.*/",
|
|
"color": "#EAB839"
|
|
},
|
|
{
|
|
"alias": "/.*eth1.*/",
|
|
"color": "#6ED0E0"
|
|
},
|
|
{
|
|
"alias": "/.*eth2.*/",
|
|
"color": "#EF843C"
|
|
},
|
|
{
|
|
"alias": "/.*eth3.*/",
|
|
"color": "#E24D42"
|
|
},
|
|
{
|
|
"alias": "/.*eth4.*/",
|
|
"color": "#1F78C1"
|
|
},
|
|
{
|
|
"alias": "/.*eth5.*/",
|
|
"color": "#BA43A9"
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "irate(node_network_receive_bytes_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{device}} - Receive",
|
|
"refId": "O",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "irate(node_network_transmit_bytes_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{device}} - Transmit",
|
|
"refId": "P",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Network Traffic",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "Bps",
|
|
"label": "Bytes out (-) / in (+)",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
}
|
|
],
|
|
"repeat": null,
|
|
"title": "CPU/Memory/Network Detailed Overview",
|
|
"type": "row"
|
|
},
|
|
{
|
|
"collapsed": true,
|
|
"gridPos": {
|
|
"h": 1,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 9
|
|
},
|
|
"id": 271,
|
|
"panels": [
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"decimals": 3,
|
|
"description": "",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 10
|
|
},
|
|
"id": 43,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_filesystem_avail_bytes{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{mountpoint}} - Available",
|
|
"metric": "",
|
|
"refId": "A",
|
|
"step": 4
|
|
},
|
|
{
|
|
"expr": "node_filesystem_free_bytes{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'}",
|
|
"format": "time_series",
|
|
"hide": true,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{mountpoint}} - Free",
|
|
"refId": "B",
|
|
"step": 2
|
|
},
|
|
{
|
|
"expr": "node_filesystem_size_bytes{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'}",
|
|
"format": "time_series",
|
|
"hide": true,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{mountpoint}} - Size",
|
|
"refId": "D",
|
|
"step": 2
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Filesystem space available",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "bytes",
|
|
"label": "Bytes",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"description": "",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 10
|
|
},
|
|
"id": 41,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"hideZero": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_filesystem_files_free{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{mountpoint}} - Free file nodes",
|
|
"refId": "B",
|
|
"step": 4
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "File Nodes Free",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "File Nodes",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"description": "",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 20
|
|
},
|
|
"id": 28,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_filefd_maximum{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 4,
|
|
"legendFormat": "Max open files",
|
|
"refId": "A",
|
|
"step": 8
|
|
},
|
|
{
|
|
"expr": "node_filefd_allocated{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Open files",
|
|
"refId": "B",
|
|
"step": 4
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "File Descriptor",
|
|
"tooltip": {
|
|
"shared": false,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Files",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"description": "",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 20
|
|
},
|
|
"id": 219,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"hideZero": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_filesystem_files{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{mountpoint}} - File nodes total",
|
|
"refId": "A",
|
|
"step": 4
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "File Nodes Total",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "File Nodes",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
}
|
|
],
|
|
"repeat": null,
|
|
"title": "Filesystem Metrics",
|
|
"type": "row"
|
|
},
|
|
{
|
|
"collapsed": true,
|
|
"gridPos": {
|
|
"h": 1,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 10
|
|
},
|
|
"id": 265,
|
|
"panels": [
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"decimals": 3,
|
|
"description": "",
|
|
"fill": 4,
|
|
"gridPos": {
|
|
"h": 12,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 9
|
|
},
|
|
"height": "",
|
|
"id": 156,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sort": "current",
|
|
"sortDesc": false,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_filesystem_size_bytes{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'} - node_filesystem_avail_bytes{instance=~\"($node):$port\",job=~\"$job\",device!~'rootfs'}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{mountpoint}}",
|
|
"refId": "A",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Disk Space Used",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "bytes",
|
|
"label": "Bytes",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {
|
|
"io time": "#890F02"
|
|
},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"decimals": 3,
|
|
"description": "",
|
|
"fill": 4,
|
|
"gridPos": {
|
|
"h": 12,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 9
|
|
},
|
|
"id": 42,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sort": null,
|
|
"sortDesc": null,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "/.*read.*/",
|
|
"transform": "negative-Y"
|
|
},
|
|
{
|
|
"alias": "/.*sda.*/",
|
|
"color": "#7EB26D"
|
|
},
|
|
{
|
|
"alias": "/.*sdb.*/",
|
|
"color": "#EAB839"
|
|
},
|
|
{
|
|
"alias": "/.*sdc.*/",
|
|
"color": "#6ED0E0"
|
|
},
|
|
{
|
|
"alias": "/.*sdd.*/",
|
|
"color": "#EF843C"
|
|
},
|
|
{
|
|
"alias": "/.*sde.*/",
|
|
"color": "#E24D42"
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "irate(node_disk_read_bytes_total{instance=~\"($node):$port\",job=~\"$job\",device=~\"[a-z]*[a-z]\"}[5m])",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{device}} - Successfully read bytes",
|
|
"refId": "A",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "irate(node_disk_written_bytes_total{instance=~\"($node):$port\",job=~\"$job\",device=~\"[a-z]*[a-z]\"}[5m])",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{device}} - Successfully written bytes",
|
|
"refId": "B",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "I/O Usage Read / Write",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": false,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "bytes",
|
|
"label": "Bytes read (-) / write (+)",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "ms",
|
|
"label": "",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"description": "",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 12,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 21
|
|
},
|
|
"id": 229,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"hideZero": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "/.*Read.*/",
|
|
"transform": "negative-Y"
|
|
},
|
|
{
|
|
"alias": "/.*sda_.*/",
|
|
"color": "#7EB26D"
|
|
},
|
|
{
|
|
"alias": "/.*sdb_.*/",
|
|
"color": "#EAB839"
|
|
},
|
|
{
|
|
"alias": "/.*sdc_.*/",
|
|
"color": "#6ED0E0"
|
|
},
|
|
{
|
|
"alias": "/.*sdd_.*/",
|
|
"color": "#EF843C"
|
|
},
|
|
{
|
|
"alias": "/.*sde_.*/",
|
|
"color": "#E24D42"
|
|
},
|
|
{
|
|
"alias": "/.*sda1.*/",
|
|
"color": "#584477"
|
|
},
|
|
{
|
|
"alias": "/.*sda2_.*/",
|
|
"color": "#BA43A9"
|
|
},
|
|
{
|
|
"alias": "/.*sda3_.*/",
|
|
"color": "#F4D598"
|
|
},
|
|
{
|
|
"alias": "/.*sdb1.*/",
|
|
"color": "#0A50A1"
|
|
},
|
|
{
|
|
"alias": "/.*sdb2.*/",
|
|
"color": "#BF1B00"
|
|
},
|
|
{
|
|
"alias": "/.*sdb3.*/",
|
|
"color": "#E0752D"
|
|
},
|
|
{
|
|
"alias": "/.*sdc1.*/",
|
|
"color": "#962D82"
|
|
},
|
|
{
|
|
"alias": "/.*sdc2.*/",
|
|
"color": "#614D93"
|
|
},
|
|
{
|
|
"alias": "/.*sdc3.*/",
|
|
"color": "#9AC48A"
|
|
},
|
|
{
|
|
"alias": "/.*sdd1.*/",
|
|
"color": "#65C5DB"
|
|
},
|
|
{
|
|
"alias": "/.*sdd2.*/",
|
|
"color": "#F9934E"
|
|
},
|
|
{
|
|
"alias": "/.*sdd3.*/",
|
|
"color": "#EA6460"
|
|
},
|
|
{
|
|
"alias": "/.*sde1.*/",
|
|
"color": "#E0F9D7"
|
|
},
|
|
{
|
|
"alias": "/.*sde2.*/",
|
|
"color": "#FCEACA"
|
|
},
|
|
{
|
|
"alias": "/.*sde3.*/",
|
|
"color": "#F9E2D2"
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "irate(node_disk_reads_completed_total{instance=~\"($node):$port\",job=~\"$job\",device=~\"[a-z]*[a-z]\"}[5m])",
|
|
"format": "time_series",
|
|
"intervalFactor": 4,
|
|
"legendFormat": "{{device}} - Reads completed",
|
|
"refId": "A",
|
|
"step": 480
|
|
},
|
|
{
|
|
"expr": "irate(node_disk_writes_completed_total{instance=~\"($node):$port\",job=~\"$job\",device=~\"[a-z]*[a-z]\"}[5m])",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{device}} - Writes completed",
|
|
"refId": "B",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Disk IOps",
|
|
"tooltip": {
|
|
"shared": false,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "iops",
|
|
"label": "IO read (-) / write (+)",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {
|
|
"io time": "#890F02"
|
|
},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"decimals": 3,
|
|
"description": "",
|
|
"fill": 4,
|
|
"gridPos": {
|
|
"h": 12,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 21
|
|
},
|
|
"id": 127,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sort": null,
|
|
"sortDesc": null,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "irate(node_disk_io_time_seconds_total{instance=~\"($node):$port\",job=~\"$job\",device=~\"[a-z]*[a-z]\"} [5m])",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{device}} - Seconds spent doing I/Os",
|
|
"refId": "C",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "I/O Usage Times",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": false,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "s",
|
|
|
|
"label": "Seconds",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "ms",
|
|
"label": "",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
}
|
|
],
|
|
"repeat": null,
|
|
"title": "Disk Metrics",
|
|
"type": "row"
|
|
},
|
|
{
|
|
"collapsed": true,
|
|
"gridPos": {
|
|
"h": 1,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 11
|
|
},
|
|
"id": 272,
|
|
"panels": [
|
|
{
|
|
"aliasColors": {
|
|
"receive_packets_eth0": "#7EB26D",
|
|
"receive_packets_lo": "#E24D42",
|
|
"transmit_packets_eth0": "#7EB26D",
|
|
"transmit_packets_lo": "#E24D42"
|
|
},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 12
|
|
},
|
|
"id": 60,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 300,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "/.*Trans.*/",
|
|
"transform": "negative-Y"
|
|
},
|
|
{
|
|
"alias": "/.*lo.*/",
|
|
"color": "#7EB26D"
|
|
},
|
|
{
|
|
"alias": "/.*eth0.*/",
|
|
"color": "#EAB839"
|
|
},
|
|
{
|
|
"alias": "/.*eth1.*/",
|
|
"color": "#6ED0E0"
|
|
},
|
|
{
|
|
"alias": "/.*eth2.*/",
|
|
"color": "#EF843C"
|
|
},
|
|
{
|
|
"alias": "/.*eth3.*/",
|
|
"color": "#E24D42"
|
|
},
|
|
{
|
|
"alias": "/.*eth4.*/",
|
|
"color": "#1F78C1"
|
|
},
|
|
{
|
|
"alias": "/.*eth5.*/",
|
|
"color": "#BA43A9"
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "irate(node_network_receive_packets_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{device}} - Receive",
|
|
"refId": "O",
|
|
"step": 4
|
|
},
|
|
{
|
|
"expr": "irate(node_network_transmit_packets_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{device}} - Transmit",
|
|
"refId": "P",
|
|
"step": 4
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Network Traffic by Packets",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "pps",
|
|
"label": "Packets out (-) / in (+)",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 12
|
|
},
|
|
"id": 142,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"hideEmpty": false,
|
|
"hideZero": false,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 300,
|
|
"sort": "current",
|
|
"sortDesc": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "/.*Trans.*/",
|
|
"transform": "negative-Y"
|
|
},
|
|
{
|
|
"alias": "/.*lo.*.errors.*/",
|
|
"color": "#7EB26D"
|
|
},
|
|
{
|
|
"alias": "/.*eth0.*.errors.*/",
|
|
"color": "#EAB839"
|
|
},
|
|
{
|
|
"alias": "/.*eth1.*.errors.*/",
|
|
"color": "#6ED0E0"
|
|
},
|
|
{
|
|
"alias": "/.*eth2.*.errors.*/",
|
|
"color": "#EF843C"
|
|
},
|
|
{
|
|
"alias": "/.*eth3.*.errors.*/",
|
|
"color": "#E24D42"
|
|
},
|
|
{
|
|
"alias": "/.*eth4.*.errors.*/",
|
|
"color": "#1F78C1"
|
|
},
|
|
{
|
|
"alias": "/.*eth5.*.errors.*/",
|
|
"color": "#BA43A9"
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "irate(node_network_receive_errs_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{device}} - Receive errors",
|
|
"refId": "E",
|
|
"step": 4
|
|
},
|
|
{
|
|
"expr": "irate(node_network_transmit_errs_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{device}} - Rransmit errors",
|
|
"refId": "F",
|
|
"step": 4
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Network Traffic Errors",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "pps",
|
|
"label": "Packets out (-) / in (+)",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 22
|
|
},
|
|
"id": 143,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"hideEmpty": false,
|
|
"hideZero": false,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 300,
|
|
"sort": "current",
|
|
"sortDesc": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "/.*Trans.*/",
|
|
"transform": "negative-Y"
|
|
},
|
|
{
|
|
"alias": "/.*lo.*.drop.*/",
|
|
"color": "#7EB26D"
|
|
},
|
|
{
|
|
"alias": "/.*eth0.*.drop.*/",
|
|
"color": "#EAB839"
|
|
},
|
|
{
|
|
"alias": "/.*eth1.*.drop.*/",
|
|
"color": "#6ED0E0"
|
|
},
|
|
{
|
|
"alias": "/.*eth2.*.drop.*/",
|
|
"color": "#EF843C"
|
|
},
|
|
{
|
|
"alias": "/.*eth3.*.drop.*/",
|
|
"color": "#E24D42"
|
|
},
|
|
{
|
|
"alias": "/.*eth4.*.drop.*/",
|
|
"color": "#1F78C1"
|
|
},
|
|
{
|
|
"alias": "/.*eth5.*.drop.*/",
|
|
"color": "#BA43A9"
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "irate(node_network_receive_drop_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{device}} - Receive drop",
|
|
"refId": "G",
|
|
"step": 4
|
|
},
|
|
{
|
|
"expr": "irate(node_network_transmit_drop_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{device}} - Transmit drop",
|
|
"refId": "H",
|
|
"step": 4
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Network Traffic Drop",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "pps",
|
|
"label": "Packets out (-) / in (+)",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 22
|
|
},
|
|
"id": 61,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "NF conntrack limit",
|
|
"color": "#890F02",
|
|
"fill": 0
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_nf_conntrack_entries{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "NF conntrack entries",
|
|
"refId": "O",
|
|
"step": 4
|
|
},
|
|
{
|
|
"expr": "node_nf_conntrack_entries_limit{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "NF conntrack limit",
|
|
"refId": "P",
|
|
"step": 4
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "NF Contrack",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Entries",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 32
|
|
},
|
|
"id": 63,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"hideEmpty": false,
|
|
"hideZero": false,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 300,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_sockstat_TCP_alloc{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "TCP_alloc - Allocated sockets",
|
|
"refId": "D",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_sockstat_TCP_inuse{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "TCP_inuse - Tcp sockets currently in use",
|
|
"refId": "E",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_sockstat_TCP_mem{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "TCP_mem - Used memory for tcp",
|
|
"refId": "F",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_sockstat_TCP_orphan{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "TCP_orphan - Orphan sockets",
|
|
"refId": "H",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_sockstat_TCP_tw{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "TCP_tw - Sockets wating close",
|
|
"refId": "I",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Sockstat TCP",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Sockets",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 32
|
|
},
|
|
"id": 124,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"hideEmpty": false,
|
|
"hideZero": false,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 300,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_sockstat_UDPLITE_inuse{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "UDPLITE_inuse - Udplite sockets currently in use",
|
|
"refId": "J",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_sockstat_UDP_inuse{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "UDP_inuse - Udp sockets currently in use",
|
|
"refId": "K",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_sockstat_UDP_mem{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "UDP_mem - Used memory for udp",
|
|
"refId": "L",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Sockstat UDP",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Sockets",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 42
|
|
},
|
|
"id": 126,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"hideEmpty": false,
|
|
"hideZero": false,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 300,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_sockstat_sockets_used{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Sockets_used - Sockets currently in use",
|
|
"refId": "N",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Sockstat Used",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Sockets",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 42
|
|
},
|
|
"id": 220,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"hideEmpty": false,
|
|
"hideZero": false,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sideWidth": 300,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_sockstat_TCP_mem_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "TCP_mem_bytes - ",
|
|
"refId": "G",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_sockstat_UDP_mem_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "UDP_mem_bytes - ",
|
|
"refId": "A",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Sockstat Memory Size",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "bytes",
|
|
"label": "Bytes",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
}
|
|
],
|
|
"repeat": null,
|
|
"title": "Network Detailed Metrics",
|
|
"type": "row"
|
|
},
|
|
{
|
|
"collapsed": true,
|
|
"gridPos": {
|
|
"h": 1,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 12
|
|
},
|
|
"id": 269,
|
|
"panels": [
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 13
|
|
},
|
|
"id": 7,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"repeat": null,
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_load1{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 4,
|
|
"legendFormat": "Load 1m",
|
|
"refId": "A",
|
|
"step": 480
|
|
},
|
|
{
|
|
"expr": "node_load5{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 4,
|
|
"legendFormat": "Load 5m",
|
|
"refId": "B",
|
|
"step": 480
|
|
},
|
|
{
|
|
"expr": "node_load15{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 4,
|
|
"legendFormat": "Load 15m",
|
|
"refId": "C",
|
|
"step": 480
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "System Load",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Load",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 13
|
|
},
|
|
"id": 62,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_procs_blocked{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Processes blocked waiting for I/O to complete",
|
|
"refId": "A",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_procs_running{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Processes in runnable state",
|
|
"refId": "B",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Processes State",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Processes",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 23
|
|
},
|
|
"id": 149,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "process_virtual_memory_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"interval": "",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Processes virtual memory size in bytes",
|
|
"refId": "C",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "process_resident_memory_bytes{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"interval": "",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Processes resident memory size in bytes",
|
|
"refId": "A",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Processes Memory",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "decbytes",
|
|
"label": "Bytes",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 23
|
|
},
|
|
"id": 64,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "/.*Max*./",
|
|
"color": "#890F02",
|
|
"fill": 0
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "process_max_fds{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"interval": "",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Maximum open file descriptors",
|
|
"refId": "A",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "process_open_fds{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"interval": "",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Open file descriptors",
|
|
"refId": "B",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "File Descriptors",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Descriptors",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 33
|
|
},
|
|
"id": 8,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"repeat": null,
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "irate(node_context_switches_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Context switches",
|
|
"refId": "A",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "irate(node_intr_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Interrupts",
|
|
"refId": "B",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Context Switches / Interrupts",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Counter",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 33
|
|
},
|
|
"id": 148,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 4,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "rate(node_forks_total{instance=~\"($node):$port\",job=~\"$job\"}[5m])",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Processes forks second",
|
|
"refId": "C",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Processes Forks",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Forks / sec",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"description": "",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 43
|
|
},
|
|
"id": 260,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "/.*Variation*./",
|
|
"color": "#890F02"
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_timex_estimated_error_seconds{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"interval": "",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Estimated error in seconds",
|
|
"refId": "B",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_timex_offset_seconds{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"interval": "",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Time offset in between local system and reference clock",
|
|
"refId": "A",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "node_timex_maxerror_seconds{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"interval": "",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "Maximum error in seconds",
|
|
"refId": "C",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "Time Syncronized Drift",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "s",
|
|
"label": "Seconds",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
}
|
|
],
|
|
"repeat": null,
|
|
"title": "System Metrics",
|
|
"type": "row"
|
|
},
|
|
{
|
|
"collapsed": true,
|
|
"gridPos": {
|
|
"h": 1,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 13
|
|
},
|
|
"id": 314,
|
|
"panels": [
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 14
|
|
},
|
|
"height": "",
|
|
"id": 316,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"hideZero": false,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sortDesc": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 2,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_mountstats_nfs_transport_connect_total{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"instant": false,
|
|
"interval": "",
|
|
"intervalFactor": 1,
|
|
"legendFormat": "NFS client connections",
|
|
"refId": "C",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "NFS Client Connections",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Connections",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {
|
|
"receive_packets_eth0": "#7EB26D",
|
|
"receive_packets_lo": "#E24D42",
|
|
"transmit_packets_eth0": "#7EB26D",
|
|
"transmit_packets_lo": "#E24D42"
|
|
},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 3,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 14
|
|
},
|
|
"id": 315,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "Read",
|
|
"transform": "negative-Y"
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "sum(rate(node_mountstats_nfs_write_bytes_total{instance=~\"($node):$port\",job=~\"$job\"}[1m]))",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"instant": false,
|
|
"interval": "",
|
|
"intervalFactor": 1,
|
|
"legendFormat": "Write",
|
|
"refId": "A",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "sum(rate(node_mountstats_nfs_read_bytes_total{instance=~\"($node):$port\",job=~\"$job\"}[1m]))",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"interval": "",
|
|
"intervalFactor": 1,
|
|
"legendFormat": "Read",
|
|
"refId": "B"
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "NFS Client I/O",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "Bps",
|
|
"label": "",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
}
|
|
],
|
|
"title": "NFS Client Metrics",
|
|
"type": "row"
|
|
},
|
|
{
|
|
"collapsed": true,
|
|
"gridPos": {
|
|
"h": 1,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 14
|
|
},
|
|
"id": 310,
|
|
"panels": [
|
|
{
|
|
"aliasColors": {},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 2,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 15
|
|
},
|
|
"height": "",
|
|
"id": 308,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"hideZero": false,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"sortDesc": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"minSpan": 2,
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "node_nfsd_connections_total{instance=~\"($node):$port\",job=~\"$job\"}",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"instant": false,
|
|
"interval": "",
|
|
"intervalFactor": 1,
|
|
"legendFormat": "NFS kernel server connections",
|
|
"refId": "C",
|
|
"step": 240
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "NFS Kernel Server Connections",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "short",
|
|
"label": "Connections",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": "0",
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
},
|
|
{
|
|
"aliasColors": {
|
|
"receive_packets_eth0": "#7EB26D",
|
|
"receive_packets_lo": "#E24D42",
|
|
"transmit_packets_eth0": "#7EB26D",
|
|
"transmit_packets_lo": "#E24D42"
|
|
},
|
|
"bars": false,
|
|
"dashLength": 10,
|
|
"dashes": false,
|
|
"datasource": "Prometheus",
|
|
"fill": 3,
|
|
"gridPos": {
|
|
"h": 10,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 15
|
|
},
|
|
"id": 312,
|
|
"legend": {
|
|
"alignAsTable": true,
|
|
"avg": true,
|
|
"current": true,
|
|
"max": true,
|
|
"min": true,
|
|
"rightSide": false,
|
|
"show": true,
|
|
"total": false,
|
|
"values": true
|
|
},
|
|
"lines": true,
|
|
"linewidth": 1,
|
|
"links": [],
|
|
"nullPointMode": "null",
|
|
"percentage": false,
|
|
"pointradius": 5,
|
|
"points": false,
|
|
"renderer": "flot",
|
|
"seriesOverrides": [
|
|
{
|
|
"alias": "Read",
|
|
"transform": "negative-Y"
|
|
}
|
|
],
|
|
"spaceLength": 10,
|
|
"stack": false,
|
|
"steppedLine": false,
|
|
"targets": [
|
|
{
|
|
"expr": "sum(rate(node_nfsd_disk_bytes_written_total{instance=~\"($node):$port\",job=~\"$job\"}[1m]))",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 1,
|
|
"legendFormat": "Write",
|
|
"refId": "A",
|
|
"step": 240
|
|
},
|
|
{
|
|
"expr": "sum(rate(node_nfsd_disk_bytes_read_total{instance=~\"($node):$port\",job=~\"$job\"}[1m]))",
|
|
"format": "time_series",
|
|
"hide": false,
|
|
"intervalFactor": 1,
|
|
"legendFormat": "Read",
|
|
"refId": "B"
|
|
}
|
|
],
|
|
"thresholds": [],
|
|
"timeFrom": null,
|
|
"timeShift": null,
|
|
"title": "NFS Kernel Server I/O",
|
|
"tooltip": {
|
|
"shared": true,
|
|
"sort": 0,
|
|
"value_type": "individual"
|
|
},
|
|
"type": "graph",
|
|
"xaxis": {
|
|
"buckets": null,
|
|
"mode": "time",
|
|
"name": null,
|
|
"show": true,
|
|
"values": []
|
|
},
|
|
"yaxes": [
|
|
{
|
|
"format": "Bps",
|
|
"label": "",
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": true
|
|
},
|
|
{
|
|
"format": "short",
|
|
"label": null,
|
|
"logBase": 1,
|
|
"max": null,
|
|
"min": null,
|
|
"show": false
|
|
}
|
|
],
|
|
"yaxis": {
|
|
"align": false,
|
|
"alignLevel": null
|
|
}
|
|
}
|
|
],
|
|
"title": "NFS Kernel Server Metrics",
|
|
"type": "row"
|
|
}
|
|
],
|
|
"refresh": "5s",
|
|
"schemaVersion": 16,
|
|
"style": "dark",
|
|
"tags": [],
|
|
"templating": {
|
|
"list": [
|
|
{
|
|
"allValue": null,
|
|
"current": {},
|
|
"datasource": "Prometheus",
|
|
"hide": 0,
|
|
"includeAll": true,
|
|
"label": "Resource",
|
|
"multi": false,
|
|
"name": "job",
|
|
"options": [],
|
|
"query": "label_values(node_boot_time_seconds, job)",
|
|
"refresh": 2,
|
|
"regex": "",
|
|
"sort": 1,
|
|
"tagValuesQuery": "",
|
|
"tags": [],
|
|
"tagsQuery": "",
|
|
"type": "query",
|
|
"useTags": false
|
|
},
|
|
{
|
|
"allValue": null,
|
|
"current": {},
|
|
"datasource": "Prometheus",
|
|
"hide": 0,
|
|
"includeAll": true,
|
|
"label": "Node",
|
|
"multi": false,
|
|
"name": "node",
|
|
"options": [],
|
|
"query": "label_values(node_boot_time_seconds{job=~\"$job\"}, instance)",
|
|
"refresh": 2,
|
|
"regex": "/([^:]+):.*/",
|
|
"sort": 1,
|
|
"tagValuesQuery": "",
|
|
"tags": [],
|
|
"tagsQuery": "",
|
|
"type": "query",
|
|
"useTags": false
|
|
},
|
|
{
|
|
"allValue": null,
|
|
"current": {},
|
|
"datasource": "Prometheus",
|
|
"hide": 2,
|
|
"includeAll": false,
|
|
"label": "Port (NE)",
|
|
"multi": false,
|
|
"name": "port",
|
|
"options": [],
|
|
"query": "label_values(node_boot_time_seconds{instance=~\"$node:(.*)\"}, instance)",
|
|
"refresh": 2,
|
|
"regex": "/[^:]+:(.*)/",
|
|
"sort": 3,
|
|
"tagValuesQuery": "",
|
|
"tags": [],
|
|
"tagsQuery": "",
|
|
"type": "query",
|
|
"useTags": false
|
|
},
|
|
{
|
|
"allValue": null,
|
|
"current": {},
|
|
"datasource": "Prometheus",
|
|
"hide": 2,
|
|
"includeAll": false,
|
|
"label": "Port (CA)",
|
|
"multi": false,
|
|
"name": "port_ca",
|
|
"options": [],
|
|
"query": "label_values(cadvisor_version_info{instance=~\"$node:(.*)\"}, instance)",
|
|
"refresh": 2,
|
|
"regex": "/[^:]+:(.*)/",
|
|
"sort": 0,
|
|
"tagValuesQuery": "",
|
|
"tags": [],
|
|
"tagsQuery": "",
|
|
"type": "query",
|
|
"useTags": false
|
|
}
|
|
]
|
|
},
|
|
"time": {
|
|
"from": "now-15m",
|
|
"to": "now"
|
|
},
|
|
"timepicker": {
|
|
"refresh_intervals": [
|
|
"5s",
|
|
"10s",
|
|
"30s",
|
|
"1m",
|
|
"5m",
|
|
"15m",
|
|
"30m",
|
|
"1h",
|
|
"2h",
|
|
"1d"
|
|
],
|
|
"time_options": [
|
|
"5m",
|
|
"15m",
|
|
"1h",
|
|
"6h",
|
|
"12h",
|
|
"24h",
|
|
"2d",
|
|
"7d",
|
|
"30d"
|
|
]
|
|
},
|
|
"timezone": "utc",
|
|
"title": "Batch Shipyard Dashboard",
|
|
"uid": "absdash",
|
|
"version": 1
|
|
}
|