diff --git a/k8s_overview.json b/k8s_overview.json index 51ed63d..b62214f 100644 --- a/k8s_overview.json +++ b/k8s_overview.json @@ -1,8603 +1,8801 @@ { - "annotations": { - "list": [ - { - "builtIn": 1, - "datasource": { - "type": "grafana", - "uid": "-- Grafana --" - }, - "enable": true, - "hide": true, - "iconColor": "rgba(0, 211, 255, 1)", - "name": "Annotations & Alerts", - "type": "dashboard" - } - ] + "annotations": { + "list": [ + { + "builtIn": 1, + "datasource": { + "type": "grafana", + "uid": "-- Grafana --" + }, + "enable": true, + "hide": true, + "iconColor": "rgba(0, 211, 255, 1)", + "name": "Annotations & Alerts", + "type": "dashboard" + } + ] + }, + "description": "This dashboard is designed to be a one-stop solution for monitoring your Kubernetes cluster", + "editable": true, + "fiscalYearStartMonth": 0, + "graphTooltip": 0, + "id": 38, + "links": [], + "panels": [ + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 38, + "panels": [], + "title": "Cluster Health", + "type": "row" }, - "description": "This dashboard is designed to be a one-stop solution for monitoring your Kubernetes cluster", - "editable": false, - "fiscalYearStartMonth": 0, - "graphTooltip": 0, - "id": 50, - "links": [], - "panels": [ - { - "collapsed": true, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 0 + { + "fieldConfig": { + "defaults": {}, + "overrides": [] + }, + "gridPos": { + "h": 2, + "w": 4, + "x": 0, + "y": 1 + }, + "id": 109, + "options": { + "code": { + "language": "plaintext", + "showLineNumbers": false, + "showMiniMap": false }, - "id": 38, - "panels": [ - { - "fieldConfig": { - "defaults": {}, - "overrides": [] - }, - "gridPos": { - "h": 2, - "w": 4, - "x": 0, - "y": 1 - }, - "id": 109, - "options": { - "code": { - "language": "plaintext", - "showLineNumbers": false, - "showMiniMap": false - }, - "content": "
\n

API Server

\n
\n", - "mode": "html" - }, - "pluginVersion": "10.4.3", - "title": "", - "type": "text" + "content": "
\n

API Server

\n
\n", + "mode": "html" + }, + "pluginVersion": "12.1.0", + "title": "", + "type": "text" + }, + { + "fieldConfig": { + "defaults": {}, + "overrides": [] + }, + "gridPos": { + "h": 2, + "w": 20, + "x": 4, + "y": 1 + }, + "id": 110, + "options": { + "code": { + "language": "plaintext", + "showLineNumbers": false, + "showMiniMap": false + }, + "content": "
\n

Nodes

\n
\n", + "mode": "html" + }, + "pluginVersion": "12.1.0", + "title": "", + "type": "text" + }, + { + "datasource": { + "type": "prometheus", + "uid": "prom" + }, + "description": "Indicates whether API Server, Scheduler or Controller manager is down.", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" }, - { - "fieldConfig": { - "defaults": {}, - "overrides": [] - }, - "gridPos": { - "h": 2, - "w": 20, - "x": 4, - "y": 1 - }, - "id": 110, - "options": { - "code": { - "language": "plaintext", - "showLineNumbers": false, - "showMiniMap": false + "mappings": [ + { + "options": { + "match": "null", + "result": { + "text": "UP" + } }, - "content": "
\n

Nodes

\n
\n", - "mode": "html" - }, - "pluginVersion": "10.4.3", - "title": "", - "type": "text" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "Indicates whether API Server, Scheduler or Controller manager is down.", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "text": "UP" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 4, - "x": 0, - "y": 3 - }, - "id": 31, - "maxDataPoints": 100, - "options": { - "colorMode": "value", - "graphMode": "none", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ - "sum" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(up{job=~\"apiserver|kube-scheduler|kube-controller-manager\"} == 0)", - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A" + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 } - ], - "title": "Control Plane Status", - "type": "stat" + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 0, + "y": 3 + }, + "id": 31, + "maxDataPoints": 100, + "options": { + "colorMode": "value", + "graphMode": "none", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "sum" + ], + "fields": "", + "values": false + }, + 
"showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "prom" + }, + "editorMode": "code", + "expr": "sum(up{cluster=~\"$cluster\", job=~\"apiserver|kube-scheduler|kube-controller-manager\"} == 0)", + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "A" + } + ], + "title": "Control Plane Status", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "rgba(237, 129, 40, 0.89)", + "value": 1 + }, + { + "color": "#d44a3a", + "value": 3 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 2, + "w": 4, + "x": 4, + "y": 3 + }, + "id": 32, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "none", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_node_spec_unschedulable{cluster=~\"$cluster\"})", + "format": "time_series", + "interval": "", + "intervalFactor": 1, + "legendFormat": "", + "range": true, + "refId": "A" + } + ], + "title": "Node Unschedulable", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "This is true if there is insufficient 
memory on the node, which could cause the node to swap frequently.", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "rgba(237, 129, 40, 0.89)", + "value": 1 + }, + { + "color": "#d44a3a" + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 8, + "y": 3 + }, + "id": 36, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "none", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_node_status_condition{cluster=~\"$cluster\", condition=\"MemoryPressure\", status!=\"false\"})", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "Memory Pressure", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "This condition is true if there is insufficient disk space on the node.", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "rgba(237, 129, 40, 0.89)", + "value": 1 + }, + { + "color": "#d44a3a" + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": 
{ + "h": 4, + "w": 4, + "x": 12, + "y": 3 + }, + "id": 34, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "none", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_node_status_condition{cluster=~\"$cluster\", condition=\"DiskPressure\", status!=\"false\"})", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "Disk Pressure", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "True when there are too many processes running on the node, indicating a potential exhaustion of process identifiers (PIDs).", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "rgba(237, 129, 40, 0.89)", + "value": 1 + }, + { + "color": "#d44a3a" + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 16, + "y": 3 + }, + "id": 37, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "none", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + 
"datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_node_status_condition{cluster=~\"$cluster\", condition=\"PIDPressure\", status!=\"false\"})", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "PID Pressure", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Indicates that the network to the node is not correctly configured or not available.", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "rgba(237, 129, 40, 0.89)", + "value": 1 + }, + { + "color": "#d44a3a" + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 20, + "y": 3 + }, + "id": 35, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_node_status_condition{cluster=~\"$cluster\", condition=\"NetworkUnavailable\", status!=\"false\"})", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "Network Unavailable", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { 
+ "match": "null", + "result": { + "text": "N/A" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "rgba(237, 129, 40, 0.89)", + "value": 1 + }, + { + "color": "#d44a3a", + "value": 3 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 2, + "w": 4, + "x": 4, + "y": 5 + }, + "id": 33, + "maxDataPoints": 100, + "options": { + "colorMode": "value", + "graphMode": "none", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_node_status_condition{cluster=~\"$cluster\", condition=\"Ready\",status!=\"true\"})", + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "A" + } + ], + "title": "Node Not Ready", + "type": "stat" + }, + { + "fieldConfig": { + "defaults": {}, + "overrides": [] + }, + "gridPos": { + "h": 2, + "w": 24, + "x": 0, + "y": 7 + }, + "id": 111, + "options": { + "code": { + "language": "plaintext", + "showLineNumbers": false, + "showMiniMap": false + }, + "content": "
\n

Pods

\n
\n", + "mode": "html" + }, + "pluginVersion": "12.1.0", + "title": "", + "type": "text" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Last 15Min", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "rgba(237, 129, 40, 0.89)", + "value": 1 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 8, + "x": 0, + "y": 9 + }, + "id": 51, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(increase(kube_pod_status_phase{cluster=~\"$cluster\", phase=\"Failed\"}[15m]))", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "Failed Pods", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Indicates that there are pods that were evicted", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "red", + "value": 1 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + 
"h": 8, + "w": 16, + "x": 8, + "y": 9 + }, + "id": 102, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(increase(kube_pod_status_reason{cluster=~\"$cluster\"}[15m])) by (reason) ", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "__auto", + "range": true, + "refId": "A" + } + ], + "title": "Failed Pods Reason", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Last 15Min", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "red", + "value": 1 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 8, + "x": 0, + "y": 13 + }, + "id": 53, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(increase(kube_pod_status_scheduled{cluster=~\"$cluster\", 
condition=\"false\"}[15m]))", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "Unscheduled Pods", + "type": "stat" + }, + { + "fieldConfig": { + "defaults": {}, + "overrides": [] + }, + "gridPos": { + "h": 2, + "w": 24, + "x": 0, + "y": 17 + }, + "id": 112, + "options": { + "code": { + "language": "plaintext", + "showLineNumbers": false, + "showMiniMap": false + }, + "content": "
\n

Containers

\n
\n", + "mode": "html" + }, + "pluginVersion": "12.1.0", + "title": "", + "type": "text" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Last 15Min", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "red", + "value": 1 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 0, + "y": 19 + }, + "id": 105, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(increase(kube_pod_container_status_waiting_reason{cluster=~\"$cluster\", reason=\"CrashLoopBackOff\"}[15m]))", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "CrashLoopBackOff", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Last 15Min", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "red", + "value": 1 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 4, + 
"x": 4, + "y": 19 + }, + "id": 106, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(increase(kube_pod_container_status_waiting_reason{cluster=~\"$cluster\", reason=\"ErrImagePull\"}[15m]))", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "ErrImagePull", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Last 15Min", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "red", + "value": 1 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 4, + "x": 8, + "y": 19 + }, + "id": 107, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(increase(kube_pod_container_status_waiting_reason{cluster=~\"$cluster\", 
reason=\"ImagePullBackOff\"}[15m]))", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "ImagePullBackOff", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "red", + "value": 1 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 12, + "y": 19 + }, + "id": 108, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "kube_pod_container_status_last_terminated_reason{cluster=~\"$cluster\", reason=\"OOMKilled\"} == 1", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "OOM Killed Containers", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Last 15Min", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "color": "#299c46", + "text": "0" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "#299c46", + "value": 0 + }, + { + "color": "orange", + "value": 1 + } + ] + }, + "unit": 
"none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 6, + "x": 18, + "y": 19 + }, + "id": 127, + "maxDataPoints": 100, + "options": { + "colorMode": "background", + "graphMode": "none", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "count(sum{cluster=~\"$cluster\"})", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "Containers in CPU Throttling", + "type": "stat" + }, + { + "fieldConfig": { + "defaults": {}, + "overrides": [] + }, + "gridPos": { + "h": 2, + "w": 24, + "x": 0, + "y": 23 + }, + "id": 113, + "options": { + "code": { + "language": "plaintext", + "showLineNumbers": false, + "showMiniMap": false + }, + "content": "
\n

Persistent Volume Claims

\n
\n", + "mode": "html" + }, + "pluginVersion": "12.1.0", + "title": "", + "type": "text" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [], + "noValue": "--", + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "semi-dark-red", + "value": 0 + }, + { + "color": "green", + "value": -0.0001 + }, + { + "color": "semi-dark-red", + "value": 0.0001 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 12, + "x": 0, + "y": 25 + }, + "id": 60, + "options": { + "colorMode": "background", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "auto", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "mean" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "count (max by (persistentvolumeclaim,namespace) (kubelet_volume_stats_used_bytes{cluster=~\"$cluster\", } ) and (max by (persistentvolumeclaim,namespace) (kubelet_volume_stats_used_bytes{} )) / (max by (persistentvolumeclaim,namespace) (kubelet_volume_stats_capacity_bytes{} )) >= (80 / 100)) or vector (0)", + "instant": true, + "interval": "", + "legendFormat": "", + "refId": "A" + } + ], + "title": "PVCs Above 80%", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [], + "noValue": "--", + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "semi-dark-red", + "value": 0 + }, + { + "color": "green", + "value": -0.0001 + }, + { + "color": "semi-dark-red", + "value": 0.0001 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 4, + "w": 12, + 
"x": 12, + "y": 25 + }, + "id": 114, + "options": { + "colorMode": "background", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "auto", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "mean" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_persistentvolumeclaim_status_phase{cluster=~\"$cluster\", phase=\"Lost\"})", + "instant": true, + "interval": "", + "legendFormat": "", + "refId": "A" + } + ], + "title": "PVCs in Lost State", + "type": "stat" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 29 + }, + "id": 6, + "panels": [], + "title": "Global", + "type": "row" + }, + { + "fieldConfig": { + "defaults": {}, + "overrides": [] + }, + "gridPos": { + "h": 2, + "w": 12, + "x": 0, + "y": 30 + }, + "id": 91, + "options": { + "code": { + "language": "plaintext", + "showLineNumbers": false, + "showMiniMap": false + }, + "content": "
\n

Memory Information

\n
\n", + "mode": "html" + }, + "pluginVersion": "12.1.0", + "title": "", + "type": "text" + }, + { + "fieldConfig": { + "defaults": {}, + "overrides": [] + }, + "gridPos": { + "h": 2, + "w": 12, + "x": 12, + "y": 30 + }, + "id": 90, + "options": { + "code": { + "language": "plaintext", + "showLineNumbers": false, + "showMiniMap": false + }, + "content": "
\n

CPU Information

\n
\n", + "mode": "html" + }, + "pluginVersion": "12.1.0", + "title": "", + "type": "text" + }, + { + "datasource": { + "type": "prometheus", + "uid": "prom" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "decimals": 1, + "mappings": [], + "max": 1, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "orange", + "value": 0.65 + }, + { + "color": "red", + "value": 0.8 + } + ] + }, + "unit": "percentunit" + }, + "overrides": [] + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 32 + }, + "id": 83, + "options": { + "displayMode": "lcd", + "legend": { + "calcs": [], + "displayMode": "list", + "placement": "bottom", + "showLegend": false + }, + "maxVizHeight": 300, + "minVizHeight": 16, + "minVizWidth": 8, + "namePlacement": "auto", + "orientation": "horizontal", + "reduceOptions": { + "calcs": [ + "last" + ], + "fields": "", + "values": false + }, + "showUnfilled": true, + "sizing": "auto", + "valueMode": "color" + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "prom" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(container_memory_working_set_bytes{cluster=~\"$cluster\", container!=\"\"}) / sum(kube_node_status_allocatable{resource=\"memory\", unit=\"byte\"})", + "format": "time_series", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "Real", + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "prom" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_pod_container_resource_requests{cluster=~\"$cluster\", resource=\"memory\", unit=\"byte\"}) / sum(kube_node_status_allocatable{resource=\"memory\", unit=\"byte\"})", + "format": "time_series", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "Requests", + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "prom" + }, + "editorMode": 
"code", + "exemplar": true, + "expr": "sum(kube_pod_container_resource_limits{cluster=~\"$cluster\", resource=\"memory\", unit=\"byte\"}) / sum(kube_node_status_allocatable{resource=\"memory\", unit=\"byte\"})", + "format": "time_series", + "hide": false, + "instant": true, + "interval": "", + "intervalFactor": 1, + "legendFormat": "Limits", + "refId": "B", + "step": 10 + } + ], + "title": "Node Memory Ratio", + "type": "bargauge" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "decimals": 1, + "mappings": [], + "max": 1, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "orange", + "value": 0.65 + }, + { + "color": "red", + "value": 0.8 + } + ] + }, + "unit": "percentunit" + }, + "overrides": [] + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 32 + }, + "id": 82, + "options": { + "displayMode": "lcd", + "legend": { + "calcs": [], + "displayMode": "list", + "placement": "bottom", + "showLegend": false + }, + "maxVizHeight": 300, + "minVizHeight": 10, + "minVizWidth": 0, + "namePlacement": "auto", + "orientation": "horizontal", + "reduceOptions": { + "calcs": [ + "last" + ], + "fields": "", + "values": false + }, + "showUnfilled": false, + "sizing": "auto", + "text": {}, + "valueMode": "color" + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum (irate(container_cpu_usage_seconds_total{cluster=~\"$cluster\", container!=\"\"}[2m])) / sum(kube_node_status_allocatable{resource=\"cpu\", unit=\"core\"})", + "format": "time_series", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "Real", + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": 
"sum(kube_pod_container_resource_requests{cluster=~\"$cluster\", resource=\"cpu\", unit=\"core\"}) / sum(kube_node_status_allocatable{resource=\"cpu\", unit=\"core\"})", + "format": "time_series", + "instant": true, + "interval": "", + "legendFormat": "Requests", + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_pod_container_resource_limits{cluster=~\"$cluster\", resource=\"cpu\", unit=\"core\"}) / sum(kube_node_status_allocatable{resource=\"cpu\", unit=\"core\"})", + "format": "time_series", + "instant": true, + "interval": "", + "legendFormat": "Limits", + "refId": "B" + } + ], + "title": "Node CPU Ratio", + "type": "bargauge" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "decimals": 1, + "mappings": [], + "max": 2000000000000, + "min": 1, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "text", + "value": 0 + } + ] + }, + "unit": "bytes" + }, + "overrides": [] + }, + "gridPos": { + "h": 6, + "w": 12, + "x": 0, + "y": 39 + }, + "id": 84, + "options": { + "colorMode": "value", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "vertical", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "last" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_node_status_allocatable{cluster=~\"$cluster\", resource=\"memory\", unit=\"byte\"})", + "instant": true, + "interval": "", + "legendFormat": "Total Memory", + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum 
(container_memory_working_set_bytes{cluster=~\"$cluster\", container!=\"\"})", + "instant": true, + "interval": "", + "legendFormat": "Usage", + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_pod_container_resource_requests{cluster=~\"$cluster\", resource=\"memory\", unit=\"byte\"})", + "instant": true, + "interval": "", + "legendFormat": "Requests", + "refId": "D" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_pod_container_resource_limits{cluster=~\"$cluster\", resource=\"memory\", unit=\"byte\"})", + "instant": true, + "interval": "", + "legendFormat": "Limits", + "refId": "B" + } + ], + "title": "Node Memory Information", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "decimals": 1, + "mappings": [], + "max": 500, + "min": 1, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "text", + "value": 0 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 6, + "w": 12, + "x": 12, + "y": 39 + }, + "id": 85, + "options": { + "colorMode": "value", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "vertical", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "last" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_node_status_allocatable{cluster=~\"$cluster\", resource=\"cpu\", unit=\"core\"})", + "instant": true, + "interval": "", + "legendFormat": "Total Cores", + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": 
"Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum (irate(container_cpu_usage_seconds_total{cluster=~\"$cluster\", id=\"/\"}[2m]))", + "instant": true, + "interval": "", + "legendFormat": "Usage", + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_pod_container_resource_requests{cluster=~\"$cluster\", resource=\"cpu\", unit=\"core\"})", + "instant": true, + "interval": "", + "legendFormat": "Requests", + "refId": "D" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_pod_container_resource_limits{cluster=~\"$cluster\", resource=\"cpu\", unit=\"core\"})", + "instant": true, + "interval": "", + "legendFormat": "Limit", + "refId": "B" + } + ], + "title": "Node CPU Number of cores", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 15, + "gradientMode": "opacity", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "linear", + "lineWidth": 1, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "bytes" + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "Total Memory" + }, + "properties": [ + { + "id": 
"color", + "value": { + "fixedColor": "red", + "mode": "fixed" + } + }, + { + "id": "custom.lineWidth", + "value": 2 + } + ] + } + ] + }, + "gridPos": { + "h": 6, + "w": 12, + "x": 0, + "y": 45 + }, + "id": 88, + "options": { + "legend": { + "calcs": [], + "displayMode": "list", + "placement": "bottom", + "showLegend": false + }, + "tooltip": { + "hideZeros": false, + "mode": "multi", + "sort": "desc" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_node_status_allocatable{cluster=~\"$cluster\", resource=\"memory\", unit=\"byte\"})", + "instant": false, + "interval": "", + "legendFormat": "Total Memory", + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum (container_memory_working_set_bytes{cluster=~\"$cluster\", container!=\"\"})", + "instant": false, + "interval": "", + "legendFormat": "Usage", + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_pod_container_resource_requests{cluster=~\"$cluster\", resource=\"memory\", unit=\"byte\"})", + "hide": true, + "instant": false, + "interval": "", + "legendFormat": "Requests", + "refId": "D" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_pod_container_resource_limits{cluster=~\"$cluster\", resource=\"memory\", unit=\"byte\"})", + "hide": true, + "instant": false, + "interval": "", + "legendFormat": "Limit", + "refId": "B" + } + ], + "title": "Memory Usage", + "type": "timeseries" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + 
"axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 15, + "gradientMode": "opacity", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "linear", + "lineWidth": 1, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "none" + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "Total Cores" + }, + "properties": [ + { + "id": "color", + "value": { + "fixedColor": "red", + "mode": "fixed" + } + }, + { + "id": "custom.lineWidth", + "value": 2 + } + ] + } + ] + }, + "gridPos": { + "h": 6, + "w": 12, + "x": 12, + "y": 45 + }, + "id": 89, + "options": { + "legend": { + "calcs": [], + "displayMode": "list", + "placement": "bottom", + "showLegend": false + }, + "tooltip": { + "hideZeros": false, + "mode": "multi", + "sort": "desc" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_node_status_allocatable{cluster=~\"$cluster\", resource=\"cpu\", unit=\"core\"})", + "instant": false, + "interval": "", + "legendFormat": "Total Cores", + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum (irate(container_cpu_usage_seconds_total{cluster=~\"$cluster\", id=\"/\"}[2m]))", + "instant": false, + "interval": "", + "legendFormat": "Usage", + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": 
"code", + "exemplar": true, + "expr": "sum(kube_pod_container_resource_requests{cluster=~\"$cluster\", resource=\"cpu\", unit=\"core\"})", + "hide": true, + "instant": false, + "interval": "", + "legendFormat": "Requests", + "refId": "D" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_pod_container_resource_limits{cluster=~\"$cluster\", resource=\"cpu\", unit=\"core\"})", + "hide": true, + "instant": true, + "interval": "", + "legendFormat": "Limit", + "refId": "B" + } + ], + "title": "CPU Used Cores", + "type": "timeseries" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 51 + }, + "id": 79, + "panels": [], + "title": "Cluster Resource Count", + "type": "row" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green" + }, + { + "color": "red", + "value": 80 + } + ] + } + }, + "overrides": [ + { + "matcher": { + "id": "byRegexp", + "options": "/Anomaly.*/" + }, + "properties": [ + { + "id": "color", + "value": { + "fixedColor": "red", + "mode": "fixed" + } + } + ] + } + ] + }, + "gridPos": { + "h": 2, + "w": 24, + "x": 0, + "y": 52 + }, + "id": 81, + "maxPerRow": 2, + "options": { + "colorMode": "background", + "graphMode": "none", + "justifyMode": "center", + "orientation": "auto", + "reduceOptions": { + "calcs": [ + "last" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "text": {}, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "10.4.3", + "repeat": "origin_prometheus", + "repeatDirection": "v", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "count({cluster=~\"$cluster\", 
__name__=~\"kube_deployment_metadata_generation|kube_daemonset_metadata_generation|kube_statefulset_metadata_generation\",})", + "hide": false, + "instant": true, + "legendFormat": "Workload", + "range": false, + "refId": "F" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "count(kube_pod_info{cluster=~\"$cluster\", })", + "hide": false, + "instant": true, + "legendFormat": "Total Pod", + "range": false, + "refId": "E" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "count by(key)(kube_node_spec_taint{cluster=~\"$cluster\", key=~\"node.kubernetes.io.*\"})", + "format": "time_series", + "hide": false, + "instant": true, + "legendFormat": "{{key}}", + "range": false, + "refId": "D" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "count by(origin_prometheus)(kube_node_info{cluster=~\"$cluster\", })", + "hide": false, + "instant": true, + "legendFormat": "Total Nodes", + "range": false, + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "count by(origin_prometheus)(kube_node_info{cluster=~\"$cluster\", }) - count by(origin_prometheus)(kube_node_spec_taint{key!~\"node.kubernetes.io.*\"})", + "hide": false, + "instant": true, + "legendFormat": "Normal Node", + "range": false, + "refId": "B" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "count by(key)(kube_node_spec_taint{cluster=~\"$cluster\", key!~\"node.kubernetes.io.*\"})", + "hide": false, + "instant": true, + "legendFormat": "{{key}}", + "range": false, + "refId": "A" + } + ], + "title": "", + "transformations": [ + { + "id": "renameByRegex", + "options": { + "regex": "(node.kubernetes.io/)(.*)", + 
"renamePattern": "Abnormal:$2" + } + } + ], + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 25, + "gradientMode": "opacity", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "smooth", + "lineWidth": 2, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "short" + }, + "overrides": [] + }, + "gridPos": { + "h": 11, + "w": 24, + "x": 0, + "y": 54 + }, + "id": 80, + "options": { + "legend": { + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true, + "sortBy": "Max", + "sortDesc": true + }, + "tooltip": { + "hideZeros": false, + "mode": "multi", + "sort": "desc" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_pod_info{cluster=~\"$cluster\", })", + "interval": "", + "legendFormat": "Running Pods", + "range": true, + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_service_info{cluster=~\"$cluster\", })", + "interval": "", + "legendFormat": "Services", + "range": true, + "refId": "B" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + 
"expr": "sum(kube_ingress_info{cluster=~\"$cluster\", })", + "interval": "", + "legendFormat": "Ingresses", + "range": true, + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_deployment_labels{cluster=~\"$cluster\", })", + "interval": "", + "legendFormat": "Deployments", + "range": true, + "refId": "D" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_statefulset_labels{cluster=~\"$cluster\", })", + "interval": "", + "legendFormat": "Statefulsets", + "range": true, + "refId": "E" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_daemonset_labels{cluster=~\"$cluster\", })", + "interval": "", + "legendFormat": "Daemonsets", + "range": true, + "refId": "F" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_persistentvolumeclaim_info{cluster=~\"$cluster\", })", + "interval": "", + "legendFormat": "Persistent Volume Claims", + "range": true, + "refId": "G" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_hpa_labels{cluster=~\"$cluster\", })", + "interval": "", + "legendFormat": "Horizontal Pod Autoscalers", + "range": true, + "refId": "H" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_configmap_info{cluster=~\"$cluster\", })", + "interval": "", + "legendFormat": "Configmaps", + "range": true, + "refId": "I" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_secret_info{cluster=~\"$cluster\", })", + "interval": "", + "legendFormat": "Secrets", + "range": true, + "refId": "J" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": 
"sum(kube_networkpolicy_labels{cluster=~\"$cluster\", })", + "interval": "", + "legendFormat": "Network Policies ", + "range": true, + "refId": "K" + } + ], + "title": "Kubernetes Resource Count - Total", + "type": "timeseries" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 25, + "gradientMode": "opacity", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "smooth", + "lineWidth": 2, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "short" + }, + "overrides": [] + }, + "gridPos": { + "h": 12, + "w": 24, + "x": 0, + "y": 65 + }, + "id": 118, + "options": { + "legend": { + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true, + "sortBy": "Max", + "sortDesc": true + }, + "tooltip": { + "hideZeros": false, + "maxHeight": 600, + "mode": "multi", + "sort": "none" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(kube_pod_status_qos_class{cluster=~\"$cluster\", }) by (qos_class)", + "interval": "", + "legendFormat": "{{ qos_class }} pods", + "range": true, + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": 
"code", + "expr": "sum(kube_pod_info{cluster=~\"$cluster\", })", + "hide": false, + "legendFormat": "Total pods", + "range": true, + "refId": "B" + } + ], + "title": "Kubernetes Pods QoS classes", + "type": "timeseries" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 77 + }, + "id": 27, + "panels": [], + "title": "Nodes", + "type": "row" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "This table shows health status of nodes.", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "custom": { + "align": "auto", + "cellOptions": { + "type": "auto" + }, + "inspect": false + }, + "mappings": [ + { + "options": { + "0": { + "index": 1, + "text": "OK" + }, + "1": { + "index": 0, + "text": "BAD" + } + }, + "type": "value" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "transparent", + "value": 0 + }, + { + "color": "red", + "value": 1 + } + ] + } + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "Unschedulable" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + } + ] }, { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "matcher": { + "id": "byName", + "options": "Not Ready" }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" - }, - { - "color": "rgba(237, 129, 40, 0.89)", - "value": 1 - }, - { - "color": "#d44a3a", - "value": 3 - } - ] - }, - "unit": "none" - }, - "overrides": [] + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Disk Pressure " }, - "gridPos": { - "h": 2, - "w": 4, - "x": 4, - 
"y": 3 + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Memory Pressure" }, - "id": 32, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "none", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "PID Pressure" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "mode": "gradient", + "type": "color-background" + } + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Network Unavailable" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + } + ] + } + ] + }, + "gridPos": { + "h": 10, + "w": 24, + "x": 0, + "y": 78 + }, + "id": 39, + "options": { + "cellHeight": "sm", + "footer": { + "countRows": false, + "fields": "", + "reducer": [ + "sum" + ], + "show": false + }, + "showHeader": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "prometheus" + }, + "editorMode": "code", + "expr": "sum(kube_node_spec_unschedulable{cluster=~\"$cluster\"}) by (node)", + "format": "table", + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_node_status_condition{cluster=~\"$cluster\", condition=\"Ready\",status!=\"true\"}) by (node)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "B" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_node_status_condition{cluster=~\"$cluster\", 
condition=\"DiskPressure\", status!=\"false\"}) by (node)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_node_status_condition{cluster=~\"$cluster\", condition=\"MemoryPressure\", status!=\"false\"}) by (node)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "D" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_node_status_condition{cluster=~\"$cluster\", condition=\"PIDPressure\", status!=\"false\"}) by (node)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "E" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_node_status_condition{cluster=~\"$cluster\", condition=\"NetworkUnavailable\", status!=\"false\"}) by (node)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "F" + } + ], + "title": "Health Status by Node", + "transformations": [ + { + "id": "groupBy", + "options": { + "fields": { + "Value": { + "aggregations": [ "lastNotNull" ], - "fields": "", - "values": false + "operation": "aggregate" }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_node_spec_unschedulable)", - "format": "time_series", - "interval": "", - "intervalFactor": 1, - "legendFormat": "", - "range": true, - "refId": "A" - } - ], - "title": "Node Unschedulable", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" 
- }, - "description": "This is true if there is insufficient memory on the node, which could cause the node to swap frequently.", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" - }, - { - "color": "rgba(237, 129, 40, 0.89)", - "value": 1 - }, - { - "color": "#d44a3a" - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 4, - "x": 8, - "y": 3 - }, - "id": 36, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "none", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ + "Value #A": { + "aggregations": [ "lastNotNull" ], - "fields": "", - "values": false + "operation": "aggregate" }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_node_status_condition{condition=\"MemoryPressure\", status!=\"false\"})", - "format": "time_series", - "intervalFactor": 1, - "range": true, - "refId": "A" - } - ], - "title": "Memory Pressure", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "This condition is true if there is insufficient disk space on the node.", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" - }, - { - "color": "rgba(237, 129, 40, 0.89)", - "value": 1 - }, - { - 
"color": "#d44a3a" - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 4, - "x": 12, - "y": 3 - }, - "id": 34, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "none", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ + "Value #B": { + "aggregations": [ "lastNotNull" ], - "fields": "", - "values": false + "operation": "aggregate" }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_node_status_condition{condition=\"DiskPressure\", status!=\"false\"})", - "format": "time_series", - "intervalFactor": 1, - "range": true, - "refId": "A" - } - ], - "title": "Disk Pressure", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "True when there are too many processes running on the node, indicating a potential exhaustion of process identifiers (PIDs).", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" - }, - { - "color": "rgba(237, 129, 40, 0.89)", - "value": 1 - }, - { - "color": "#d44a3a" - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 4, - "x": 16, - "y": 3 - }, - "id": 37, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "none", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ + "Value #C": { + "aggregations": [ "lastNotNull" ], - "fields": "", - "values": 
false + "operation": "aggregate" }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_node_status_condition{condition=\"PIDPressure\", status!=\"false\"})", - "format": "time_series", - "intervalFactor": 1, - "range": true, - "refId": "A" - } - ], - "title": "PID Pressure", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "Indicates that the network to the node is not correctly configured or not available.", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" - }, - { - "color": "rgba(237, 129, 40, 0.89)", - "value": 1 - }, - { - "color": "#d44a3a" - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 4, - "x": 20, - "y": 3 - }, - "id": 35, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ + "Value #D": { + "aggregations": [ "lastNotNull" ], - "fields": "", - "values": false + "operation": "aggregate" }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_node_status_condition{condition=\"NetworkUnavailable\", status!=\"false\"})", - "format": "time_series", - "intervalFactor": 1, - "range": true, - "refId": "A" - } - ], - "title": "Network Unavailable", - 
"type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "text": "N/A" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" - }, - { - "color": "rgba(237, 129, 40, 0.89)", - "value": 1 - }, - { - "color": "#d44a3a", - "value": 3 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 2, - "w": 4, - "x": 4, - "y": 5 - }, - "id": 33, - "maxDataPoints": 100, - "options": { - "colorMode": "value", - "graphMode": "none", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ + "Value #E": { + "aggregations": [ "lastNotNull" ], - "fields": "", - "values": false + "operation": "aggregate" }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_node_status_condition{condition=\"Ready\",status!=\"true\"})", - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A" - } - ], - "title": "Node Not Ready", - "type": "stat" - }, - { - "fieldConfig": { - "defaults": {}, - "overrides": [] - }, - "gridPos": { - "h": 2, - "w": 24, - "x": 0, - "y": 7 - }, - "id": 111, - "options": { - "code": { - "language": "plaintext", - "showLineNumbers": false, - "showMiniMap": false - }, - "content": "
\n

Pods

\n
\n", - "mode": "html" - }, - "pluginVersion": "10.4.3", - "title": "", - "type": "text" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "Last 15Min", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" - }, - { - "color": "rgba(237, 129, 40, 0.89)", - "value": 1 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 8, - "x": 0, - "y": 9 - }, - "id": 51, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ + "Value #F": { + "aggregations": [ "lastNotNull" ], - "fields": "", - "values": false + "operation": "aggregate" }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(increase(kube_pod_status_phase{phase=\"Failed\"}[15m]))", - "format": "time_series", - "intervalFactor": 1, - "range": true, - "refId": "A" + "node": { + "aggregations": [], + "operation": "groupby" } - ], - "title": "Failed Pods", - "type": "stat" + } + } + }, + { + "id": "merge", + "options": {} + }, + { + "id": "organize", + "options": { + "excludeByName": {}, + "indexByName": {}, + "renameByName": { + "Value #A (lastNotNull)": "Unschedulable", + "Value #B (lastNotNull)": "Not Ready", + "Value #C (lastNotNull)": "Disk Pressure ", + "Value #D (lastNotNull)": "Memory Pressure", + "Value #E (lastNotNull)": "PID Pressure", + "Value #F (lastNotNull)": "Network Unavailable", + "node": "Node" + } + } + } + ], + "type": 
"table" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "custom": { + "align": "center", + "cellOptions": { + "type": "auto" }, - "description": "Indicates that there are pods that were evicted", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { + "filterable": false, + "inspect": false + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + } + }, + "overrides": [ + { + "matcher": { + "id": "byRegexp", + "options": ".*%" + }, + "properties": [ + { + "id": "unit", + "value": "percentunit" + }, + { + "id": "thresholds", + "value": { "mode": "absolute", "steps": [ { - "color": "#299c46" - }, - { - "color": "red", - "value": 1 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 8, - "w": 16, - "x": 8, - "y": 9 - }, - "id": 102, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(increase(kube_pod_status_reason[15m])) by (reason)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "__auto", - "range": true, - "refId": "A" - } - ], - "title": "Failed Pods Reason", - "type": "stat" - }, - { - 
"datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "Last 15Min", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" - }, - { - "color": "red", - "value": 1 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 8, - "x": 0, - "y": 13 - }, - "id": 53, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(increase(kube_pod_status_scheduled{condition=\"false\"}[15m]))", - "format": "time_series", - "intervalFactor": 1, - "range": true, - "refId": "A" - } - ], - "title": "Unscheduled Pods", - "type": "stat" - }, - { - "fieldConfig": { - "defaults": {}, - "overrides": [] - }, - "gridPos": { - "h": 2, - "w": 24, - "x": 0, - "y": 17 - }, - "id": 112, - "options": { - "code": { - "language": "plaintext", - "showLineNumbers": false, - "showMiniMap": false - }, - "content": "
\n

Containers

\n
\n", - "mode": "html" - }, - "pluginVersion": "10.4.3", - "title": "", - "type": "text" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "Last 15Min", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" - }, - { - "color": "red", - "value": 1 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 4, - "x": 0, - "y": 19 - }, - "id": 105, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(increase(kube_pod_container_status_waiting_reason{reason=\"CrashLoopBackOff\"}[15m]))", - "format": "time_series", - "intervalFactor": 1, - "range": true, - "refId": "A" - } - ], - "title": "CrashLoopBackOff", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "Last 15Min", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" - }, - { - "color": "red", - "value": 1 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 4, - "x": 4, - "y": 19 - }, - "id": 
106, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(increase(kube_pod_container_status_waiting_reason{reason=\"ErrImagePull\"}[15m]))", - "format": "time_series", - "intervalFactor": 1, - "range": true, - "refId": "A" - } - ], - "title": "ErrImagePull", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "Last 15Min", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" - }, - { - "color": "red", - "value": 1 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 4, - "x": 8, - "y": 19 - }, - "id": 107, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(increase(kube_pod_container_status_waiting_reason{reason=\"ImagePullBackOff\"}[15m]))", - "format": "time_series", - 
"intervalFactor": 1, - "range": true, - "refId": "A" - } - ], - "title": "ImagePullBackOff", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" - }, - { - "color": "red", - "value": 1 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 6, - "x": 12, - "y": 19 - }, - "id": 108, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "kube_pod_container_status_last_terminated_reason{reason=\"OOMKilled\"} == 1", - "format": "time_series", - "intervalFactor": 1, - "range": true, - "refId": "A" - } - ], - "title": "OOM Killed Containers", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "Last 15Min", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "color": "#299c46", - "text": "0" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "#299c46" + "color": "green", + "value": 0 }, { "color": "orange", - "value": 1 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 
6, - "x": 18, - "y": 19 - }, - "id": 127, - "maxDataPoints": 100, - "options": { - "colorMode": "background", - "graphMode": "none", - "justifyMode": "auto", - "orientation": "horizontal", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "count(sum(rate(container_cpu_cfs_throttled_seconds_total[15m])) by (pod) > 0)", - "format": "time_series", - "intervalFactor": 1, - "range": true, - "refId": "A" - } - ], - "title": "Containers in CPU Throttling", - "type": "stat" - }, - { - "fieldConfig": { - "defaults": {}, - "overrides": [] - }, - "gridPos": { - "h": 2, - "w": 24, - "x": 0, - "y": 23 - }, - "id": 113, - "options": { - "code": { - "language": "plaintext", - "showLineNumbers": false, - "showMiniMap": false - }, - "content": "
\n

Persistent Volume Claims

\n
\n", - "mode": "html" - }, - "pluginVersion": "10.4.3", - "title": "", - "type": "text" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [], - "noValue": "--", - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "semi-dark-red" - }, - { - "color": "green", - "value": -0.0001 - }, - { - "color": "semi-dark-red", - "value": 0.0001 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 12, - "x": 0, - "y": 25 - }, - "id": 60, - "options": { - "colorMode": "background", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "auto", - "reduceOptions": { - "calcs": [ - "mean" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "count (max by (persistentvolumeclaim,namespace) (kubelet_volume_stats_used_bytes{} ) and (max by (persistentvolumeclaim,namespace) (kubelet_volume_stats_used_bytes{} )) / (max by (persistentvolumeclaim,namespace) (kubelet_volume_stats_capacity_bytes{} )) >= (80 / 100)) or vector (0)", - "instant": true, - "interval": "", - "legendFormat": "", - "refId": "A" - } - ], - "title": "PVCs Above 80%", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [], - "noValue": "--", - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "semi-dark-red" - }, - { - "color": "green", - "value": -0.0001 - }, - { - "color": "semi-dark-red", - "value": 0.0001 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 4, - "w": 12, - "x": 12, - "y": 25 - }, - "id": 114, - "options": { - "colorMode": 
"background", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "auto", - "reduceOptions": { - "calcs": [ - "mean" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_persistentvolumeclaim_status_phase{phase=\"Lost\"})", - "instant": true, - "interval": "", - "legendFormat": "", - "refId": "A" - } - ], - "title": "PVCs in Lost State", - "type": "stat" - } - ], - "title": "Cluster Health", - "type": "row" - }, - { - "collapsed": false, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 1 - }, - "id": 6, - "panels": [], - "title": "Global", - "type": "row" - }, - { - "fieldConfig": { - "defaults": {}, - "overrides": [] - }, - "gridPos": { - "h": 2, - "w": 12, - "x": 0, - "y": 2 - }, - "id": 91, - "options": { - "code": { - "language": "plaintext", - "showLineNumbers": false, - "showMiniMap": false - }, - "content": "
\n

Memory Information

\n
\n", - "mode": "html" - }, - "pluginVersion": "11.4.0", - "title": "", - "type": "text" - }, - { - "fieldConfig": { - "defaults": {}, - "overrides": [] - }, - "gridPos": { - "h": 2, - "w": 12, - "x": 12, - "y": 2 - }, - "id": 90, - "options": { - "code": { - "language": "plaintext", - "showLineNumbers": false, - "showMiniMap": false - }, - "content": "
\n

CPU Information

\n
\n", - "mode": "html" - }, - "pluginVersion": "11.4.0", - "title": "", - "type": "text" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "decimals": 1, - "mappings": [], - "max": 1, - "min": 0, - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green", - "value": null - }, - { - "color": "orange", - "value": 0.65 - }, - { - "color": "red", - "value": 0.8 - } - ] - }, - "unit": "percentunit" - }, - "overrides": [] - }, - "gridPos": { - "h": 7, - "w": 12, - "x": 0, - "y": 4 - }, - "id": 83, - "options": { - "displayMode": "lcd", - "legend": { - "calcs": [], - "displayMode": "list", - "placement": "bottom", - "showLegend": false - }, - "maxVizHeight": 300, - "minVizHeight": 16, - "minVizWidth": 8, - "namePlacement": "auto", - "orientation": "horizontal", - "reduceOptions": { - "calcs": [ - "last" - ], - "fields": "", - "values": false - }, - "showUnfilled": true, - "sizing": "auto", - "valueMode": "color" - }, - "pluginVersion": "11.4.0", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(container_memory_working_set_bytes{container!=\"\"}) / sum(kube_node_status_allocatable{resource=\"memory\", unit=\"byte\"})", - "format": "time_series", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "Real", - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_pod_container_resource_requests{resource=\"memory\", unit=\"byte\"}) / sum(kube_node_status_allocatable{resource=\"memory\", unit=\"byte\"})", - "format": "time_series", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "Requests", - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - 
"exemplar": true, - "expr": "sum(kube_pod_container_resource_limits{resource=\"memory\", unit=\"byte\"}) / sum(kube_node_status_allocatable{resource=\"memory\", unit=\"byte\"})", - "format": "time_series", - "hide": false, - "instant": true, - "interval": "", - "intervalFactor": 1, - "legendFormat": "Limits", - "refId": "B", - "step": 10 - } - ], - "title": "Node Memory Ratio", - "type": "bargauge" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "decimals": 1, - "mappings": [], - "max": 1, - "min": 0, - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green", - "value": null - }, - { - "color": "orange", - "value": 0.65 - }, - { - "color": "red", - "value": 0.8 - } - ] - }, - "unit": "percentunit" - }, - "overrides": [] - }, - "gridPos": { - "h": 7, - "w": 12, - "x": 12, - "y": 4 - }, - "id": 82, - "options": { - "displayMode": "lcd", - "legend": { - "calcs": [], - "displayMode": "list", - "placement": "bottom", - "showLegend": false - }, - "maxVizHeight": 300, - "minVizHeight": 10, - "minVizWidth": 0, - "namePlacement": "auto", - "orientation": "horizontal", - "reduceOptions": { - "calcs": [ - "last" - ], - "fields": "", - "values": false - }, - "showUnfilled": false, - "sizing": "auto", - "text": {}, - "valueMode": "color" - }, - "pluginVersion": "11.4.0", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum (irate(container_cpu_usage_seconds_total{container!=\"\"}[2m])) / sum(kube_node_status_allocatable{resource=\"cpu\", unit=\"core\"})", - "format": "time_series", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "Real", - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_pod_container_resource_requests{resource=\"cpu\", unit=\"core\"}) / 
sum(kube_node_status_allocatable{resource=\"cpu\", unit=\"core\"})", - "format": "time_series", - "instant": true, - "interval": "", - "legendFormat": "Requests", - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_pod_container_resource_limits{resource=\"cpu\", unit=\"core\"}) / sum(kube_node_status_allocatable{resource=\"cpu\", unit=\"core\"})", - "format": "time_series", - "instant": true, - "interval": "", - "legendFormat": "Limits", - "refId": "B" - } - ], - "title": "Node CPU Ratio", - "type": "bargauge" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "decimals": 1, - "mappings": [], - "max": 2000000000000, - "min": 1, - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "text", - "value": null - } - ] - }, - "unit": "bytes" - }, - "overrides": [] - }, - "gridPos": { - "h": 6, - "w": 12, - "x": 0, - "y": 11 - }, - "id": 84, - "options": { - "colorMode": "value", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "vertical", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ - "last" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "11.4.0", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_node_status_allocatable{resource=\"memory\", unit=\"byte\"})", - "instant": true, - "interval": "", - "legendFormat": "Total Memory", - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum (container_memory_working_set_bytes{container!=\"\"})", - "instant": true, - "interval": "", - "legendFormat": "Usage", - 
"refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_pod_container_resource_requests{resource=\"memory\", unit=\"byte\"})", - "instant": true, - "interval": "", - "legendFormat": "Requests", - "refId": "D" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_pod_container_resource_limits{resource=\"memory\", unit=\"byte\"})", - "instant": true, - "interval": "", - "legendFormat": "Limits", - "refId": "B" - } - ], - "title": "Node Memory Information", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "decimals": 1, - "mappings": [], - "max": 500, - "min": 1, - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "text", - "value": null - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 6, - "w": 12, - "x": 12, - "y": 11 - }, - "id": 85, - "options": { - "colorMode": "value", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "vertical", - "percentChangeColorMode": "standard", - "reduceOptions": { - "calcs": [ - "last" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "11.4.0", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_node_status_allocatable{resource=\"cpu\", unit=\"core\"})", - "instant": true, - "interval": "", - "legendFormat": "Total Cores", - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum (irate(container_cpu_usage_seconds_total{id=\"/\"}[2m]))", - "instant": true, - "interval": "", - 
"legendFormat": "Usage", - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_pod_container_resource_requests{resource=\"cpu\", unit=\"core\"})", - "instant": true, - "interval": "", - "legendFormat": "Requests", - "refId": "D" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_pod_container_resource_limits{resource=\"cpu\", unit=\"core\"})", - "instant": true, - "interval": "", - "legendFormat": "Limit", - "refId": "B" - } - ], - "title": "Node CPU Number of cores", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "barWidthFactor": 0.6, - "drawStyle": "line", - "fillOpacity": 15, - "gradientMode": "opacity", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green", - "value": null - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "bytes" - }, - "overrides": [ - { - "matcher": { - "id": "byName", - "options": "Total Memory" - }, - "properties": [ - { - "id": "color", - "value": { - "fixedColor": "red", - "mode": "fixed" - } - }, - { - "id": "custom.lineWidth", - "value": 2 - } - ] - } - ] - }, - "gridPos": { - "h": 6, - "w": 12, - "x": 0, - "y": 17 - }, - "id": 88, - 
"options": { - "legend": { - "calcs": [], - "displayMode": "list", - "placement": "bottom", - "showLegend": false - }, - "tooltip": { - "hideZeros": false, - "mode": "multi", - "sort": "desc" - } - }, - "pluginVersion": "11.4.0", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_node_status_allocatable{resource=\"memory\", unit=\"byte\"})", - "instant": false, - "interval": "", - "legendFormat": "Total Memory", - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum (container_memory_working_set_bytes{container!=\"\"})", - "instant": false, - "interval": "", - "legendFormat": "Usage", - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_pod_container_resource_requests{resource=\"memory\", unit=\"byte\"})", - "hide": true, - "instant": false, - "interval": "", - "legendFormat": "Requests", - "refId": "D" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_pod_container_resource_limits{resource=\"memory\", unit=\"byte\"})", - "hide": true, - "instant": false, - "interval": "", - "legendFormat": "Limit", - "refId": "B" - } - ], - "title": "Memory Usage", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "barWidthFactor": 0.6, - "drawStyle": "line", - "fillOpacity": 15, - "gradientMode": "opacity", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - 
"insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green", - "value": null - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "none" - }, - "overrides": [ - { - "matcher": { - "id": "byName", - "options": "Total Cores" - }, - "properties": [ - { - "id": "color", - "value": { - "fixedColor": "red", - "mode": "fixed" - } - }, - { - "id": "custom.lineWidth", - "value": 2 - } - ] - } - ] - }, - "gridPos": { - "h": 6, - "w": 12, - "x": 12, - "y": 17 - }, - "id": 89, - "options": { - "legend": { - "calcs": [], - "displayMode": "list", - "placement": "bottom", - "showLegend": false - }, - "tooltip": { - "hideZeros": false, - "mode": "multi", - "sort": "desc" - } - }, - "pluginVersion": "11.4.0", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_node_status_allocatable{resource=\"cpu\", unit=\"core\"})", - "instant": false, - "interval": "", - "legendFormat": "Total Cores", - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum (irate(container_cpu_usage_seconds_total{id=\"/\"}[2m]))", - "instant": false, - "interval": "", - "legendFormat": "Usage", - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_pod_container_resource_requests{resource=\"cpu\", unit=\"core\"})", - "hide": true, - "instant": false, - "interval": "", - "legendFormat": "Requests", - "refId": "D" - }, - { - "datasource": { - "type": "prometheus", - "uid": 
"${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_pod_container_resource_limits{resource=\"cpu\", unit=\"core\"})", - "hide": true, - "instant": true, - "interval": "", - "legendFormat": "Limit", - "refId": "B" - } - ], - "title": "CPU Used Cores", - "type": "timeseries" - }, - { - "collapsed": false, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 23 - }, - "id": 79, - "panels": [], - "title": "Cluster Resource Count", - "type": "row" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green", - "value": null - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [ - { - "matcher": { - "id": "byRegexp", - "options": "/Anomaly.*/" - }, - "properties": [ - { - "id": "color", - "value": { - "fixedColor": "red", - "mode": "fixed" - } - } - ] - } - ] - }, - "gridPos": { - "h": 2, - "w": 24, - "x": 0, - "y": 24 - }, - "id": 81, - "maxPerRow": 2, - "options": { - "colorMode": "background", - "graphMode": "none", - "justifyMode": "center", - "orientation": "auto", - "reduceOptions": { - "calcs": [ - "last" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "text": {}, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "repeat": "origin_prometheus", - "repeatDirection": "v", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "count({__name__=~\"kube_deployment_metadata_generation|kube_daemonset_metadata_generation|kube_statefulset_metadata_generation\",})", - "hide": false, - "instant": true, - "legendFormat": "Workload", - "range": false, - "refId": "F" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, 
- "expr": "count(kube_pod_info{})", - "hide": false, - "instant": true, - "legendFormat": "Total Pod", - "range": false, - "refId": "E" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "count by(key)(kube_node_spec_taint{key=~\"node.kubernetes.io.*\"})", - "format": "time_series", - "hide": false, - "instant": true, - "legendFormat": "{{key}}", - "range": false, - "refId": "D" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "count by(origin_prometheus)(kube_node_info{})", - "hide": false, - "instant": true, - "legendFormat": "Total Nodes", - "range": false, - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "count by(origin_prometheus)(kube_node_info{}) - count by(origin_prometheus)(kube_node_spec_taint{key!~\"node.kubernetes.io.*\"})", - "hide": false, - "instant": true, - "legendFormat": "Normal Node", - "range": false, - "refId": "B" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "count by(key)(kube_node_spec_taint{key!~\"node.kubernetes.io.*\"})", - "hide": false, - "instant": true, - "legendFormat": "{{key}}", - "range": false, - "refId": "A" - } - ], - "title": "", - "transformations": [ - { - "id": "renameByRegex", - "options": { - "regex": "(node.kubernetes.io/)(.*)", - "renamePattern": "Abnormal:$2" - } - } - ], - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "barWidthFactor": 0.6, - "drawStyle": "line", - 
"fillOpacity": 25, - "gradientMode": "opacity", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "smooth", - "lineWidth": 2, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green", - "value": null - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "short" - }, - "overrides": [] - }, - "gridPos": { - "h": 11, - "w": 24, - "x": 0, - "y": 26 - }, - "id": 80, - "options": { - "legend": { - "calcs": [ - "lastNotNull" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true, - "sortBy": "Max", - "sortDesc": true - }, - "tooltip": { - "mode": "multi", - "sort": "desc" - } - }, - "pluginVersion": "11.4.0", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_pod_info{})", - "interval": "", - "legendFormat": "Running Pods", - "range": true, - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_service_info{})", - "interval": "", - "legendFormat": "Services", - "range": true, - "refId": "B" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_ingress_info{})", - "interval": "", - "legendFormat": "Ingresses", - "range": true, - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_deployment_labels{})", - "interval": "", - "legendFormat": "Deployments", - "range": true, - "refId": "D" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": 
"sum(kube_statefulset_labels{})", - "interval": "", - "legendFormat": "Statefulsets", - "range": true, - "refId": "E" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_daemonset_labels{})", - "interval": "", - "legendFormat": "Daemonsets", - "range": true, - "refId": "F" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_persistentvolumeclaim_info{})", - "interval": "", - "legendFormat": "Persistent Volume Claims", - "range": true, - "refId": "G" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_hpa_labels{})", - "interval": "", - "legendFormat": "Horizontal Pod Autoscalers", - "range": true, - "refId": "H" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_configmap_info{})", - "interval": "", - "legendFormat": "Configmaps", - "range": true, - "refId": "I" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_secret_info{})", - "interval": "", - "legendFormat": "Secrets", - "range": true, - "refId": "J" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_networkpolicy_labels{})", - "interval": "", - "legendFormat": "Network Policies ", - "range": true, - "refId": "K" - } - ], - "title": "Kubernetes Resource Count - Total", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 25, - "gradientMode": 
"opacity", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "smooth", - "lineWidth": 2, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "short" - }, - "overrides": [] - }, - "gridPos": { - "h": 12, - "w": 24, - "x": 0, - "y": 37 - }, - "id": 118, - "options": { - "legend": { - "calcs": [ - "lastNotNull" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true, - "sortBy": "Max", - "sortDesc": true - }, - "tooltip": { - "maxHeight": 600, - "mode": "multi", - "sort": "none" - } - }, - "pluginVersion": "8.3.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(kube_pod_status_qos_class{}) by (qos_class)", - "interval": "", - "legendFormat": "{{ qos_class }} pods", - "range": true, - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_pod_info{})", - "hide": false, - "legendFormat": "Total pods", - "range": true, - "refId": "B" - } - ], - "title": "Kubernetes Pods QoS classes", - "type": "timeseries" - }, - { - "collapsed": false, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 49 - }, - "id": 27, - "panels": [], - "title": "Nodes", - "type": "row" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "This table shows health status of nodes.", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "custom": { - "align": "auto", - "cellOptions": { - "type": "auto" - }, - "inspect": false - }, - "mappings": 
[ - { - "options": { - "0": { - "index": 1, - "text": "OK" - }, - "1": { - "index": 0, - "text": "BAD" - } - }, - "type": "value" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "transparent" - }, - { - "color": "red", - "value": 1 - } - ] - } - }, - "overrides": [ - { - "matcher": { - "id": "byName", - "options": "Unschedulable" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "type": "color-background" - } - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Not Ready" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "type": "color-background" - } - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Disk Pressure " - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "type": "color-background" - } - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Memory Pressure" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "type": "color-background" - } - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "PID Pressure" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "mode": "gradient", - "type": "color-background" - } - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Network Unavailable" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "type": "color-background" - } - } - ] - } - ] - }, - "gridPos": { - "h": 10, - "w": 24, - "x": 0, - "y": 50 - }, - "id": 39, - "options": { - "cellHeight": "sm", - "footer": { - "countRows": false, - "fields": "", - "reducer": [ - "sum" - ], - "show": false - }, - "showHeader": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "prometheus" - }, - "editorMode": "code", - "expr": "sum(kube_node_spec_unschedulable) by (node)", - "format": "table", - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A" - }, - { - "datasource": { - "type": 
"prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_node_status_condition{condition=\"Ready\",status!=\"true\"}) by (node)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "B" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_node_status_condition{condition=\"DiskPressure\", status!=\"false\"}) by (node)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_node_status_condition{condition=\"MemoryPressure\", status!=\"false\"}) by (node)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "D" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_node_status_condition{condition=\"PIDPressure\", status!=\"false\"}) by (node)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "E" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_node_status_condition{condition=\"NetworkUnavailable\", status!=\"false\"}) by (node)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "F" - } - ], - "title": "Health Status by Node", - "transformations": [ - { - "id": "groupBy", - "options": { - "fields": { - "Value": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #A": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #B": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #C": { - 
"aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #D": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #E": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #F": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "node": { - "aggregations": [], - "operation": "groupby" - } - } - } - }, - { - "id": "merge", - "options": {} - }, - { - "id": "organize", - "options": { - "excludeByName": {}, - "indexByName": {}, - "renameByName": { - "Value #A (lastNotNull)": "Unschedulable", - "Value #B (lastNotNull)": "Not Ready", - "Value #C (lastNotNull)": "Disk Pressure ", - "Value #D (lastNotNull)": "Memory Pressure", - "Value #E (lastNotNull)": "PID Pressure", - "Value #F (lastNotNull)": "Network Unavailable", - "node": "Node" - } - } - } - ], - "type": "table" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "custom": { - "align": "center", - "cellOptions": { - "type": "auto" - }, - "filterable": false, - "inspect": false - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [ - { - "matcher": { - "id": "byRegexp", - "options": ".*%" - }, - "properties": [ - { - "id": "unit", - "value": "percentunit" - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "orange", - "value": 0.65 - }, - { - "color": "red", - "value": 0.8 - } - ] - } - }, - { - "id": "custom.cellOptions", - "value": { - "mode": "gradient", - "type": "color-background" - } - } - ] - }, - { - "matcher": { - "id": "byRegexp", - "options": "(mem total|mem req|mem limit)" - }, - "properties": [ - { - "id": "unit", - "value": "bytes" - }, - { - "id": "decimals", - "value": 2 - } - ] - }, - { - "matcher": 
{ - "id": "byRegexp", - "options": ".*(total|capacity)" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "type": "color-text" - } - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "blue" - } - ] - } - } - ] - }, - { - "matcher": { - "id": "byType", - "options": "number" - }, - "properties": [ - { - "id": "custom.width", - "value": 120 - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "statut" - }, - "properties": [ - { - "id": "custom.width", - "value": 100 - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "pod" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "mode": "gradient", - "type": "color-background" - } - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "#EAB839", - "value": 150 - }, - { - "color": "red", - "value": 200 - } - ] - } - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "mem limit" - }, - "properties": [ - { - "id": "custom.width" - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Node" - }, - "properties": [ - { - "id": "custom.width", - "value": 234 - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "status" - }, - "properties": [ - { - "id": "custom.width", - "value": 78 - } - ] - } - ] - }, - "gridPos": { - "h": 13, - "w": 24, - "x": 0, - "y": 60 - }, - "id": 117, - "interval": "30s", - "options": { - "cellHeight": "sm", - "footer": { - "countRows": false, - "fields": "", - "reducer": [ - "sum" - ], - "show": false - }, - "showHeader": true, - "sortBy": [ - { - "desc": true, - "displayName": "cpu limit%" - } - ] - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "kube_node_status_condition{status=\"true\"} == 1", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - 
"legendFormat": "status", - "refId": "B" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum (rate (container_cpu_usage_seconds_total{id=\"/\"}[3m])) by (node)", - "format": "table", - "hide": true, - "instant": true, - "interval": "", - "legendFormat": "node cpu used", - "refId": "I" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "kube_node_status_capacity{resource=\"cpu\"} - 0", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "node cpu capacity", - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum(kube_pod_container_resource_requests{resource=\"cpu\"}) by (node)", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "pod cpu request total", - "refId": "E" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum(kube_pod_container_resource_limits{resource=\"cpu\"}) by (node)", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "pod cpu limit total", - "refId": "F" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum (container_memory_working_set_bytes{id=\"/\"}) by (node)", - "format": "table", - "hide": true, - "instant": true, - "interval": "", - "legendFormat": "container mem used total", - "refId": "J" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "kube_node_status_capacity{resource=\"memory\"} - 0", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "node mem 
available total", - "refId": "D" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum(kube_pod_container_resource_requests{resource=\"memory\"}) by (node)", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "pod mem request total", - "refId": "G" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum(kube_pod_container_resource_limits{resource=\"memory\"}) by (node)", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "pod mem limit total", - "refId": "H" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum (container_fs_usage_bytes{device=~\"^/dev/.*$\",id=\"/\"}) by (node)", - "format": "table", - "hide": true, - "instant": true, - "interval": "", - "legendFormat": "container fs used total", - "refId": "K" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum (container_fs_limit_bytes{device=~\"^/dev/.*$\",id=\"/\"}) by (node)", - "format": "table", - "hide": true, - "instant": true, - "interval": "", - "legendFormat": "container fs limit total", - "refId": "L" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum (container_memory_working_set_bytes{id=\"/\"})by (node) / sum (machine_memory_bytes{})by (node)", - "format": "table", - "hide": true, - "instant": true, - "interval": "", - "legendFormat": "container mem used%", - "refId": "M" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum(kube_pod_container_resource_requests{resource=\"memory\"})by (node) / 
sum(kube_node_status_capacity{resource=\"memory\"})by (node)", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "pod mem request %", - "refId": "N" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum(kube_pod_container_resource_limits{resource=\"memory\"})by (node) / sum(kube_node_status_capacity{resource=\"memory\"})by (node)", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "pod mem limit %", - "refId": "O" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum (rate (container_cpu_usage_seconds_total{id=\"/\"}[2m]))by (node) / sum (machine_cpu_cores{})by (node)", - "format": "table", - "hide": true, - "instant": true, - "interval": "", - "legendFormat": "container cpu used %", - "refId": "P" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum(kube_pod_container_resource_requests{resource=\"cpu\"})by (node) / sum(kube_node_status_allocatable{resource=\"cpu\"})by (node)", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "pod cpu request %", - "refId": "Q" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum(kube_pod_container_resource_limits{resource=\"cpu\"})by (node) / sum(kube_node_status_allocatable{resource=\"cpu\"})by (node)", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "pod cpu limit %", - "refId": "R" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum (container_fs_usage_bytes{device=~\"^/dev/.*$\",id=\"/\"})by (node) / sum 
(container_fs_limit_bytes{device=~\"^/dev/.*$\",id=\"/\"})by (node)", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "container fs used %", - "refId": "S" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "sum(kube_node_status_capacity{resource=\"pods\"})by (node)", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "node pod capacity", - "refId": "T" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "count(kube_pod_info{created_by_kind!~\"|Job\"}) by (node)", - "format": "table", - "hide": false, - "instant": true, - "interval": "", - "legendFormat": "running pod", - "refId": "A" - } - ], - "title": "Statistic for node", - "transformations": [ - { - "id": "seriesToColumns", - "options": { - "byField": "node" - } - }, - { - "id": "filterFieldsByName", - "options": { - "include": { - "names": [ - "node", - "condition", - "Value #B", - "Value #C", - "Value #E", - "Value #F", - "Value #D", - "Value #G", - "Value #H", - "Value #N", - "Value #O", - "Value #Q", - "Value #R", - "Value #T", - "Value #A" - ], - "pattern": "(node|condition|Value.*)" - } - } - }, - { - "id": "organize", - "options": { - "excludeByName": { - "Time 1": true, - "Time 10": true, - "Time 11": true, - "Time 12": true, - "Time 13": true, - "Time 14": true, - "Time 15": true, - "Time 16": true, - "Time 17": true, - "Time 18": true, - "Time 19": true, - "Time 2": true, - "Time 20": true, - "Time 3": true, - "Time 4": true, - "Time 5": true, - "Time 6": true, - "Time 7": true, - "Time 8": true, - "Time 9": true, - "Value #B": true, - "Value #E": false, - "Value #F": false, - "__name__": true, - "app_kubernetes_io_name 1": true, - "app_kubernetes_io_name 2": true, - "app_kubernetes_io_name 3": true, - "app_kubernetes_io_version 1": true, - 
"app_kubernetes_io_version 2": true, - "app_kubernetes_io_version 3": true, - "condition": false, - "instance 1": true, - "instance 2": true, - "instance 3": true, - "job 1": true, - "job 2": true, - "job 3": true, - "k8s_namespace 1": true, - "k8s_namespace 2": true, - "k8s_namespace 3": true, - "k8s_sname 1": true, - "k8s_sname 2": true, - "k8s_sname 3": true, - "origin_prometheus 1": true, - "origin_prometheus 2": true, - "origin_prometheus 3": true, - "status": true - }, - "indexByName": { - "Value #A": 13, - "Value #B": 2, - "Value #C": 3, - "Value #D": 8, - "Value #E": 4, - "Value #F": 6, - "Value #G": 9, - "Value #H": 11, - "Value #N": 10, - "Value #O": 12, - "Value #Q": 5, - "Value #R": 7, - "Value #T": 14, - "condition": 1, - "node": 0 - }, - "renameByName": { - "Value #A": "pod", - "Value #C": "cpu total", - "Value #D": "mem total", - "Value #E": "cpu req", - "Value #F": "cpu limit", - "Value #G": "mem req", - "Value #H": "mem limit", - "Value #I": "cpu used", - "Value #J": "ram used", - "Value #K": "disk used", - "Value #L": "disk total", - "Value #M": "mem used%", - "Value #N": "mem req%", - "Value #O": "mem limit%", - "Value #P": "cpu used%", - "Value #Q": "cpu req%", - "Value #R": "cpu limit%", - "Value #S": "disk used%", - "Value #T": "pod capacity", - "condition": "status", - "node": "Node" - } - } - } - ], - "type": "table" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", 
- "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "percent" - }, - "overrides": [ - { - "matcher": { - "id": "byRegexp", - "options": "/Total number of cores.*/" - }, - "properties": [ - { - "id": "color", - "value": { - "fixedColor": "#C4162A", - "mode": "fixed" - } - } - ] - } - ] - }, - "gridPos": { - "h": 10, - "w": 12, - "x": 0, - "y": 73 - }, - "id": 69, - "options": { - "legend": { - "calcs": [ - "mean", - "lastNotNull", - "max" - ], - "displayMode": "table", - "placement": "bottom", - "showLegend": true - }, - "tooltip": { - "mode": "multi", - "sort": "desc" - } - }, - "pluginVersion": "10.4.1", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum (irate(container_cpu_usage_seconds_total{container!=\"\"}[2m])) by (node) / sum(kube_node_status_allocatable{resource=\"cpu\", unit=\"core\"})by (node)*100 ", - "format": "time_series", - "hide": false, - "instant": false, - "interval": "", - "legendFormat": "{{node}}", - "refId": "I" - } - ], - "title": "Node CPU Usage", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, 
- "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "percent" - }, - "overrides": [] - }, - "gridPos": { - "h": 10, - "w": 12, - "x": 12, - "y": 73 - }, - "id": 70, - "options": { - "legend": { - "calcs": [ - "mean", - "lastNotNull", - "max" - ], - "displayMode": "table", - "placement": "bottom", - "showLegend": true - }, - "tooltip": { - "mode": "multi", - "sort": "desc" - } - }, - "pluginVersion": "10.4.1", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum (container_memory_working_set_bytes{container!=\"\"})by (node) / sum(kube_node_status_allocatable{resource=\"memory\", unit=\"byte\"})by (node)*100", - "format": "time_series", - "hide": false, - "instant": false, - "interval": "", - "legendFormat": "{{node}}", - "refId": "I" - } - ], - "title": "Node Memory Usage", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "The table shows available disk size by mount points. 
Only mount point that used over 50% are displayed.", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "custom": { - "align": "auto", - "cellOptions": { - "type": "auto" - }, - "inspect": false - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [ - { - "matcher": { - "id": "byName", - "options": "Size" - }, - "properties": [ - { - "id": "unit", - "value": "decbits" - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Available" - }, - "properties": [ - { - "id": "unit", - "value": "decbits" - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Used" - }, - "properties": [ - { - "id": "unit", - "value": "decbits" - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Used (%)" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "type": "gauge" - } - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 0.8 - }, - { - "color": "#EAB839", - "value": 1 - } - ] - } - }, - { - "id": "unit", - "value": "percentunit" - }, - { - "id": "max", - "value": 1 - }, - { - "id": "min", - "value": 0 - } - ] - } - ] - }, - "gridPos": { - "h": 10, - "w": 24, - "x": 0, - "y": 83 - }, - "id": 46, - "options": { - "cellHeight": "sm", - "footer": { - "countRows": false, - "fields": "", - "reducer": [ - "sum" - ], - "show": false - }, - "showHeader": true, - "sortBy": [ - { - "desc": true, - "displayName": "Used (%)" - } - ] - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(node_filesystem_free_bytes{fstype!=\"\"}) by (instance, fstype, mountpoint)", - "format": "table", - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", 
- "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "max by (instance, fstype, mountpoint) (node_filesystem_size_bytes{job=\"node-exporter\", fstype!=\"\", mountpoint!=\"\"})", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "B" - } - ], - "title": "Disk by Mount Point", - "transformations": [ - { - "id": "groupBy", - "options": { - "fields": { - "Value": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #A": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #B": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "fstype": { - "aggregations": [], - "operation": "groupby" - }, - "instance": { - "aggregations": [], - "operation": "groupby" - }, - "mountpoint": { - "aggregations": [], - "operation": "groupby" - } - } - } - }, - { - "id": "merge", - "options": {} - }, - { - "id": "organize", - "options": { - "excludeByName": {}, - "indexByName": { - "Value #A (lastNotNull)": 4, - "Value #B (lastNotNull)": 3, - "fstype": 0, - "instance": 1, - "mountpoint": 2 - }, - "renameByName": { - "Value #A (lastNotNull)": "Available", - "Value #B (lastNotNull)": "Size", - "fstype": "FS Type", - "instance": "Instance", - "mountpoint": "Mountpoint" - } - } - }, - { - "id": "calculateField", - "options": { - "alias": "Used", - "binary": { - "left": "Size", - "operator": "-", - "right": "Available" - }, - "mode": "binary", - "reduce": { - "reducer": "sum" - } - } - }, - { - "id": "calculateField", - "options": { - "alias": "Used (%)", - "binary": { - "left": "Used", - "operator": "/", - "right": "Size" - }, - "mode": "binary", - "reduce": { - "reducer": "sum" - } - } - } - ], - "type": "table" - }, - { - "collapsed": false, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 93 - }, - "id": 20, - "panels": [], - "title": "Namespaces", - "type": "row" - }, - { - "datasource": { - "type": "prometheus", - "uid": 
"${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "custom": { - "align": "auto", - "cellOptions": { - "type": "auto" - }, - "filterable": false, - "inspect": false - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [ - { - "matcher": { - "id": "byName", - "options": "Failed Pods" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "type": "color-background" - } - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 1 - } - ] - } - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Pending Pods" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "type": "color-background" - } - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "orange", - "value": 1 - } - ] - } - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Unknown Pods" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "type": "color-background" - } - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "orange", - "value": 1 - } - ] - } - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Unscheduled Pods Last 5min" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "type": "color-background" - } - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 1 - } - ] - } - } - ] - } - ] - }, - "gridPos": { - "h": 8, - "w": 24, - "x": 0, - "y": 94 - }, - "id": 49, - "options": { - "cellHeight": "sm", - "footer": { - "countRows": false, - "enablePagination": false, - "fields": "", - "reducer": [ - "sum" - ], - "show": false - }, - 
"showHeader": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_pod_owner{job=\"kube-state-metrics\"}) by (namespace)", - "format": "table", - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "count(avg(namespace_workload_pod:kube_pod_owner:relabel{}) by (workload, namespace)) by (namespace)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "B" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_pod_status_phase{phase=\"Failed\"}) by (namespace)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_pod_status_phase{phase=\"Unknown\"}) by (namespace)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "E" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(avg_over_time(kube_pod_status_scheduled{condition=\"false\"}[5m])) by (namespace)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "F" - } - ], - "title": "Pods Status", - "transformations": [ - { - "id": "groupBy", - "options": { - "fields": { - "Value": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #A": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #B": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #C": { - 
"aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #D": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #E": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #F": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "namespace": { - "aggregations": [], - "operation": "groupby" - } - } - } - }, - { - "id": "merge", - "options": {} - }, - { - "id": "organize", - "options": { - "excludeByName": {}, - "indexByName": {}, - "renameByName": { - "Value #A (lastNotNull)": "Pods", - "Value #B (lastNotNull)": "Workloads", - "Value #C (lastNotNull)": "Failed Pods", - "Value #D (lastNotNull)": "Pending Pods", - "Value #E (lastNotNull)": "Unknown Pods", - "Value #F (lastNotNull)": "Unscheduled Pods Last 5min", - "namespace": "Namespace" - } - } - } - ], - "type": "table" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "custom": { - "align": "auto", - "cellOptions": { - "type": "auto" - }, - "inspect": false - }, - "decimals": 2, - "displayName": "", - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "short" - }, - "overrides": [ - { - "matcher": { - "id": "byName", - "options": "CPU Requests (%)" - }, - "properties": [ - { - "id": "custom.align" - }, - { - "id": "custom.cellOptions", - "value": { - "type": "color-background" - } - }, - { - "id": "unit", - "value": "percentunit" - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "orange", - "value": 0.8 - }, - { - "color": "red", - "value": 1 - } - ] - } - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "CPU Limits (%)" - }, - "properties": [ - { - "id": "unit", - "value": "percentunit" - }, - { - "id": 
"custom.cellOptions", - "value": { - "type": "color-background" - } - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "orange", - "value": 0.6 - }, - { - "color": "red", - "value": 0.8 - } - ] - } - } - ] - } - ] - }, - "gridPos": { - "h": 9, - "w": 24, - "x": 0, - "y": 102 - }, - "id": 63, - "interval": "1m", - "options": { - "cellHeight": "sm", - "footer": { - "countRows": false, - "fields": "", - "reducer": [ - "sum" - ], - "show": false - }, - "showHeader": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{}) by (namespace)", - "format": "table", - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(namespace_cpu:kube_pod_container_resource_requests:sum{}) by (namespace)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "B" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{}) by (namespace) / sum(namespace_cpu:kube_pod_container_resource_requests:sum{}) by (namespace)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(namespace_cpu:kube_pod_container_resource_limits:sum{}) by (namespace)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "D" - }, - { - "datasource": { - "type": "prometheus", - "uid": 
"${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{}) by (namespace) / sum(namespace_cpu:kube_pod_container_resource_limits:sum{}) by (namespace)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "E" - } - ], - "title": "CPU Information", - "transformations": [ - { - "id": "groupBy", - "options": { - "fields": { - "Value": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #A": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #B": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #C": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #D": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #E": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "namespace": { - "aggregations": [], - "operation": "groupby" - } - } - } - }, - { - "id": "merge", - "options": {} - }, - { - "id": "organize", - "options": { - "excludeByName": {}, - "indexByName": {}, - "renameByName": { - "Value #A (lastNotNull)": "CPU Usage (vCPU)", - "Value #B (lastNotNull)": "CPU Requests (vCPU)", - "Value #C (lastNotNull)": "CPU Requests (%)", - "Value #D (lastNotNull)": "CPU Limits (vCPU)", - "Value #E (lastNotNull)": "CPU Limits (%)", - "namespace": "Namespace" - } - } - } - ], - "type": "table" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "custom": { - "align": "auto", - "cellOptions": { - "type": "auto" - }, - "inspect": false - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "bytes" - }, - "overrides": [ - { - "matcher": { - "id": 
"byName", - "options": "Memory Requests (%)" - }, - "properties": [ - { - "id": "unit", - "value": "percentunit" - }, - { - "id": "custom.cellOptions", - "value": { - "type": "color-background" - } - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "orange", - "value": 0.8 - }, - { - "color": "red", - "value": 1 - } - ] - } - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Memory Limits (%)" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "type": "color-background" - } - }, - { - "id": "unit", - "value": "percentunit" - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "orange", - "value": 0.6 - }, - { - "color": "red", - "value": 0.8 - } - ] - } - } - ] - } - ] - }, - "gridPos": { - "h": 8, - "w": 24, - "x": 0, - "y": 111 - }, - "id": 64, - "options": { - "cellHeight": "sm", - "footer": { - "countRows": false, - "fields": "", - "reducer": [ - "sum" - ], - "show": false - }, - "showHeader": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(container_memory_rss{job=\"kubelet\", metrics_path=\"/metrics/cadvisor\", container!=\"\"}) by (namespace)", - "format": "table", - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(namespace_memory:kube_pod_container_resource_requests:sum{}) by (namespace)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "B" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(container_memory_rss{job=\"kubelet\", metrics_path=\"/metrics/cadvisor\", container!=\"\"}) by 
(namespace) / sum(namespace_memory:kube_pod_container_resource_requests:sum{}) by (namespace)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(namespace_memory:kube_pod_container_resource_limits:sum{}) by (namespace)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "D" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(container_memory_rss{job=\"kubelet\", metrics_path=\"/metrics/cadvisor\", container!=\"\"}) by (namespace) / sum(namespace_memory:kube_pod_container_resource_limits:sum{}) by (namespace)", - "format": "table", - "hide": false, - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "E" - } - ], - "title": "Memory Information", - "transformations": [ - { - "id": "groupBy", - "options": { - "fields": { - "Value #A": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #B": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #C": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #D": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "Value #E": { - "aggregations": [ - "lastNotNull" - ], - "operation": "aggregate" - }, - "namespace": { - "aggregations": [ - "lastNotNull" - ], - "operation": "groupby" - } - } - } - }, - { - "id": "merge", - "options": {} - }, - { - "id": "organize", - "options": { - "excludeByName": {}, - "indexByName": {}, - "renameByName": { - "Value #A (lastNotNull)": "Memory Usage ", - "Value #B (lastNotNull)": "Memory Requests ", - "Value #C (lastNotNull)": "Memory Requests (%)", - "Value #D (lastNotNull)": "Memory Limits", - "Value #E (lastNotNull)": "Memory Limits (%)", 
- "namespace": "Namespace" - } - } - } - ], - "type": "table" - }, - { - "collapsed": true, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 119 - }, - "id": 25, - "panels": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": {}, - "overrides": [] - }, - "gridPos": { - "h": 10, - "w": 24, - "x": 0, - "y": 22 - }, - "id": 94, - "interval": "1m", - "options": {}, - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "count(namespace_workload_pod:kube_pod_owner:relabel{}) by (workload, workload_type, namespace)", - "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "A", - "step": 10 - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "B", - "step": 10 - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(\n kube_pod_container_resource_requests{job=\"kube-state-metrics\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "C", - "step": 10 - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by 
(workload, workload_type, namespace)\n/sum(\n kube_pod_container_resource_requests{job=\"kube-state-metrics\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type, namespace)\n", - "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "D", - "step": 10 - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(\n kube_pod_container_resource_limits{job=\"kube-state-metrics\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "E", - "step": 10 - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n/sum(\n kube_pod_container_resource_limits{job=\"kube-state-metrics\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "F", - "step": 10 - } - ], - "title": "CPU Information", - "type": "table" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": {}, - "overrides": [] - }, - "gridPos": { - "h": 11, - "w": 24, - "x": 0, - "y": 32 - }, - "id": 48, - "interval": "1m", - "options": {}, - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": 
"count(namespace_workload_pod:kube_pod_owner:relabel{}) by (workload, workload_type, namespace)", - "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "A", - "step": 10 - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(\n container_memory_working_set_bytes{job=\"kubelet\", container!=\"\", image!=\"\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "B", - "step": 10 - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(\n kube_pod_container_resource_requests{job=\"kube-state-metrics\", resource=\"memory\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "C", - "step": 10 - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(\n container_memory_working_set_bytes{job=\"kubelet\", container!=\"\", image!=\"\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n/sum(\n kube_pod_container_resource_requests{job=\"kube-state-metrics\", resource=\"memory\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "D", - "step": 10 - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(\n 
kube_pod_container_resource_limits{job=\"kube-state-metrics\", resource=\"memory\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "E", - "step": 10 - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(\n container_memory_working_set_bytes{job=\"kubelet\", container!=\"\", image!=\"\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n/sum(\n kube_pod_container_resource_limits{job=\"kube-state-metrics\", resource=\"memory\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "F", - "step": 10 - } - ], - "title": "Memory Information", - "type": "table" - } - ], - "title": "Workloads", - "type": "row" - }, - { - "collapsed": true, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 120 - }, - "id": 72, - "panels": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "fixedColor": "rgb(31, 120, 193)", - "mode": "fixed" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "text": "N/A" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 3, - "w": 8, - "x": 0, - "y": 23 - }, - "id": 73, - "maxDataPoints": 100, - "options": { - "colorMode": "none", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "horizontal", - "reduceOptions": { - "calcs": [ - 
"lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_job_status_succeeded{})", - "format": "time_series", - "intervalFactor": 1, - "range": true, - "refId": "A" - } - ], - "title": "Jobs Succeeded", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "custom": { - "align": "auto", - "cellOptions": { - "type": "auto" - }, - "inspect": false - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [ - { - "matcher": { - "id": "byName", - "options": "Time" - }, - "properties": [ - { - "id": "displayName", - "value": "Time" - }, - { - "id": "unit", - "value": "time: YYYY-MM-DD HH:mm:ss" - }, - { - "id": "custom.align" - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Metric" - }, - "properties": [ - { - "id": "displayName", - "value": "Job" - }, - { - "id": "unit", - "value": "short" - }, - { - "id": "decimals", - "value": 2 - }, - { - "id": "custom.align" - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Value" - }, - "properties": [ - { - "id": "displayName", - "value": "Day" - }, - { - "id": "unit", - "value": "none" - }, - { - "id": "decimals", - "value": 4 - }, - { - "id": "custom.align" - } - ] - } - ] - }, - "gridPos": { - "h": 9, - "w": 8, - "x": 8, - "y": 23 - }, - "id": 76, - "options": { - "cellHeight": "sm", - "footer": { - "countRows": false, - "fields": "", - "reducer": [ - "sum" - ], - "show": false - }, - "showHeader": true, - "sortBy": [ - { - "desc": false, - "displayName": "Day" - } - ] - }, - "pluginVersion": "10.4.3", - 
"targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "(time()-kube_job_status_completion_time{})/60/60/24>1", - "format": "time_series", - "instant": true, - "interval": "", - "intervalFactor": 1, - "legendFormat": "{{job_name}}", - "refId": "A" - } - ], - "title": "Last Succeeded Jobs", - "transformations": [ - { - "id": "seriesToRows", - "options": { - "reducers": [] - } - } - ], - "type": "table" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "custom": { - "align": "auto", - "cellOptions": { - "type": "auto" - }, - "inspect": false - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [] - }, - "gridPos": { - "h": 9, - "w": 8, - "x": 16, - "y": 23 - }, - "id": 77, - "options": { - "cellHeight": "sm", - "footer": { - "countRows": false, - "fields": "", - "reducer": [ - "sum" - ], - "show": false - }, - "showHeader": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "kube_job_status_failed{}>=1", - "format": "time_series", - "instant": true, - "interval": "", - "intervalFactor": 1, - "legendFormat": "{{job_name}}", - "refId": "A" - } - ], - "title": "Failed Jobs", - "transformations": [ - { - "id": "labelsToFields", - "options": { - "keepLabels": [ - "job_name", - "namespace", - "reason" - ] - } - } - ], - "type": "table" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "fixedColor": "rgb(31, 120, 193)", - "mode": "fixed" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "text": "N/A" - } - }, - "type": "special" - } - ], - 
"thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 3, - "w": 8, - "x": 0, - "y": 26 - }, - "id": 74, - "maxDataPoints": 100, - "options": { - "colorMode": "none", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "horizontal", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_job_status_active{})", - "format": "time_series", - "intervalFactor": 1, - "range": true, - "refId": "A" - } - ], - "title": "Jobs Active", - "type": "stat" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "fixedColor": "rgb(31, 120, 193)", - "mode": "fixed" - }, - "mappings": [ - { - "options": { - "match": "null", - "result": { - "text": "N/A" - } - }, - "type": "special" - } - ], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 3, - "w": 8, - "x": 0, - "y": 29 - }, - "id": 75, - "maxDataPoints": 100, - "options": { - "colorMode": "none", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "horizontal", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_job_status_failed{})", - "format": "time_series", - "intervalFactor": 1, - "range": 
true, - "refId": "A" - } - ], - "title": "Jobs Failed", - "type": "stat" - } - ], - "title": "Jobs", - "type": "row" - }, - { - "collapsed": true, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 121 - }, - "id": 54, - "panels": [ - { - "fieldConfig": { - "defaults": {}, - "overrides": [] - }, - "gridPos": { - "h": 2, - "w": 24, - "x": 0, - "y": 24 - }, - "id": 123, - "options": { - "code": { - "language": "plaintext", - "showLineNumbers": false, - "showMiniMap": false - }, - "content": "
\n

CPU Information

\n
\n", - "mode": "html" - }, - "pluginVersion": "10.4.3", - "title": "", - "type": "text" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "fixedColor": "orange", - "mode": "continuous-GrYlRd" - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - } - ] - } - }, - "overrides": [] - }, - "gridPos": { - "h": 9, - "w": 24, - "x": 0, - "y": 26 - }, - "id": 120, - "options": { - "displayMode": "gradient", - "maxVizHeight": 300, - "minVizHeight": 16, - "minVizWidth": 8, - "namePlacement": "auto", - "orientation": "horizontal", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showUnfilled": true, - "sizing": "auto", - "valueMode": "color" - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "952b8fca-4117-4324-92cc-fba33c458982" - }, - "editorMode": "code", - "exemplar": false, - "expr": "topk(10, sum(rate(container_cpu_usage_seconds_total{container!=\"\"}[5m])) by (pod))", - "instant": true, - "legendFormat": "{{pod}}", - "range": false, - "refId": "A" - } - ], - "title": "Top 10 CPU Consuming Pods", - "type": "bargauge" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - 
"mode": "off" - } - }, - "links": [], - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "percent" - }, - "overrides": [] - }, - "gridPos": { - "h": 12, - "w": 24, - "x": 0, - "y": 35 - }, - "id": 93, - "options": { - "legend": { - "calcs": [ - "mean", - "lastNotNull", - "max" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true - }, - "tooltip": { - "mode": "multi", - "sort": "desc" - } - }, - "pluginVersion": "10.4.1", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "max(irate(container_cpu_usage_seconds_total{container !=\"\",container!=\"POD\"}[2m])) by (container, pod, namespace) / (max(container_spec_cpu_quota{container !=\"\",container!=\"POD\"}/100000) by (container, pod, namespace)) * 100", - "hide": false, - "instant": false, - "interval": "", - "intervalFactor": 1, - "legendFormat": "{{ namespace }} / {{ pod }}", - "metric": "container_cpu", - "refId": "A", - "step": 10 - } - ], - "title": "Pod Containers CPU Utilization", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "How many additional CPU was needed for container not to be in CPU Throttling", - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "auto", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": 
"none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [] - }, - "gridPos": { - "h": 13, - "w": 12, - "x": 0, - "y": 47 - }, - "id": 121, - "options": { - "legend": { - "calcs": [ - "lastNotNull", - "mean", - "max" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true - }, - "tooltip": { - "mode": "single", - "sort": "none" - } - }, - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "952b8fca-4117-4324-92cc-fba33c458982" - }, - "editorMode": "code", - "expr": "sum(rate(container_cpu_cfs_throttled_seconds_total{}[5m])) by (namespace,pod) > 0", - "instant": false, - "legendFormat": "{{namespace}} / {{pod}}", - "range": true, - "refId": "A" - } - ], - "title": "CPU Throttling Seconds", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "cpu cores", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 40, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 6, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "links": [], - "mappings": [], - "max": 100, - "min": 0, - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "short" - }, - "overrides": [ - { - "matcher": { - "id": "byRegexp", - "options": "/Throttle/" - }, - 
"properties": [ - { - "id": "unit", - "value": "percent" - }, - { - "id": "custom.axisLabel", - "value": "throttling percent" - } - ] - } - ] - }, - "gridPos": { - "h": 13, - "w": 12, - "x": 12, - "y": 47 - }, - "id": 119, - "options": { - "legend": { - "calcs": [ - "lastNotNull", - "mean", - "max" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true - }, - "tooltip": { - "mode": "multi", - "sort": "none" - } - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "rate(container_cpu_usage_seconds_total{}[1m])", - "legendFormat": "CPU Cores Usage {{namespace}}/{{pod}}/{{container}}", - "range": true, - "refId": "B" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum by (namespace,pod,container) ((container_cpu_cfs_throttled_periods_total{} / container_cpu_cfs_periods_total{}) * 100)", - "legendFormat": "Throttle Percent {{namespace}}/{{pod}}/{{container}}", - "range": true, - "refId": "A" - } - ], - "title": "CPU Usage vs Throttling Percent", - "type": "timeseries" - }, - { - "fieldConfig": { - "defaults": {}, - "overrides": [] - }, - "gridPos": { - "h": 2, - "w": 24, - "x": 0, - "y": 60 - }, - "id": 124, - "options": { - "code": { - "language": "plaintext", - "showLineNumbers": false, - "showMiniMap": false - }, - "content": "
\n

Memory Information

\n
\n", - "mode": "html" - }, - "pluginVersion": "10.4.3", - "title": "", - "type": "text" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "continuous-GrYlRd" - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - } - ] - }, - "unit": "bytes" - }, - "overrides": [] - }, - "gridPos": { - "h": 10, - "w": 24, - "x": 0, - "y": 62 - }, - "id": 126, - "options": { - "displayMode": "gradient", - "maxVizHeight": 300, - "minVizHeight": 16, - "minVizWidth": 8, - "namePlacement": "auto", - "orientation": "horizontal", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showUnfilled": true, - "sizing": "auto", - "valueMode": "color" - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "952b8fca-4117-4324-92cc-fba33c458982" - }, - "editorMode": "code", - "exemplar": false, - "expr": "topk(10,sum(container_memory_working_set_bytes{container!=\"\"}) by (pod))", - "instant": true, - "legendFormat": "__auto", - "range": false, - "refId": "A" - } - ], - "title": "Top 10 Memory Consuming Pods", - "type": "bargauge" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "Pods whose Mem usage/Mem limits is more then 65%.", - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "auto", - "spanNulls": false, - "stacking": { - "group": 
"A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "dashed" - } - }, - "mappings": [], - "max": 1, - "min": 0, - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "orange", - "value": 0.7 + "value": 0.65 }, { "color": "red", "value": 0.8 } ] - }, - "unit": "percentunit" + } }, - "overrides": [] - }, - "gridPos": { - "h": 11, - "w": 24, - "x": 0, - "y": 72 - }, - "id": 122, - "options": { - "legend": { - "calcs": [ - "lastNotNull", - "mean", - "max" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true - }, - "tooltip": { - "mode": "single", - "sort": "none" - } - }, - "targets": [ { - "datasource": { - "type": "prometheus", - "uid": "952b8fca-4117-4324-92cc-fba33c458982" - }, - "editorMode": "code", - "expr": "sum(container_memory_working_set_bytes{container!=\"\"}) by (namespace,pod) /\r\nsum(kube_pod_container_resource_limits{resource=\"memory\"}) by (namespace,pod) > 0.65", - "instant": false, - "legendFormat": "{{ namespace }} / {{ pod }}", - "range": true, - "refId": "A" + "id": "custom.cellOptions", + "value": { + "mode": "gradient", + "type": "color-background" + } } - ], - "title": "Pods with Potential Mem Leaks", - "type": "timeseries" + ] }, { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "matcher": { + "id": "byRegexp", + "options": "(mem total|mem req|mem limit)" }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - 
"group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "links": [], - "mappings": [], - "thresholds": { + "properties": [ + { + "id": "unit", + "value": "bytes" + }, + { + "id": "decimals", + "value": 2 + } + ] + }, + { + "matcher": { + "id": "byRegexp", + "options": ".*(total|capacity)" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "type": "color-text" + } + }, + { + "id": "thresholds", + "value": { "mode": "absolute", "steps": [ { - "color": "green" + "color": "blue", + "value": 0 + } + ] + } + } + ] + }, + { + "matcher": { + "id": "byType", + "options": "number" + }, + "properties": [ + { + "id": "custom.width", + "value": 120 + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "statut" + }, + "properties": [ + { + "id": "custom.width", + "value": 100 + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "pod" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "mode": "gradient", + "type": "color-background" + } + }, + { + "id": "thresholds", + "value": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "#EAB839", + "value": 150 }, { "color": "red", - "value": 80 + "value": 200 } ] - }, - "unit": "percent" - }, - "overrides": [] - }, - "gridPos": { - "h": 11, - "w": 24, - "x": 0, - "y": 83 - }, - "id": 95, - "options": { - "legend": { - "calcs": [ - "max", - "last", - "mean" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true - }, - "tooltip": { - "mode": "multi", - "sort": "desc" + } } - }, - "pluginVersion": "10.4.1", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "max (container_memory_working_set_bytes{container !=\"\",container!=\"POD\"}) by (namespace,container, pod)/ max(container_spec_memory_limit_bytes{container !=\"\",container!=\"POD\"}) by (namespace,container, pod) * 100", - "interval": "", 
- "intervalFactor": 1, - "legendFormat": "WSS:{{ namespace }} / {{ pod }}", - "metric": "container_memory_usage:sort_desc", - "range": true, - "refId": "A", - "step": 10 - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": false, - "expr": "max (container_memory_rss{container !=\"\",container!=\"POD\"}) by (namespace,container, pod)/ max(container_spec_memory_limit_bytes{container !=\"\",container!=\"POD\"}) by (namespace,container, pod) * 100", - "interval": "", - "intervalFactor": 1, - "legendFormat": "RSS:{{ namespace }} / {{ pod }}", - "metric": "container_memory_usage:sort_desc", - "range": true, - "refId": "B", - "step": 10 - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "(cass_jvm_heap{} * on (namespace,pod_ip) group_right(service) kube_pod_info{}) / (cass_jvm_heap_max{} * on (namespace,pod_ip) group_right(service) kube_pod_info{}) * 100", - "hide": true, - "instant": false, - "interval": "", - "intervalFactor": 1, - "legendFormat": "Heap:{{ namespace }} / {{ pod }}", - "metric": "container_memory_usage:sort_desc", - "refId": "C", - "step": 10 - } - ], - "title": "Pod Container Memory Usage", - "type": "timeseries" + ] }, { - "fieldConfig": { - "defaults": {}, - "overrides": [] + "matcher": { + "id": "byName", + "options": "mem limit" }, - "gridPos": { - "h": 2, - "w": 24, - "x": 0, - "y": 94 - }, - "id": 125, - "options": { - "code": { - "language": "plaintext", - "showLineNumbers": false, - "showMiniMap": false - }, - "content": "
\n

Events

\n
\n", - "mode": "html" - }, - "pluginVersion": "10.4.3", - "title": "", - "type": "text" + "properties": [ + { + "id": "custom.width" + } + ] }, { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "matcher": { + "id": "byName", + "options": "Node" }, - "description": "Last 1h", - "fieldConfig": { - "defaults": { - "color": { - "fixedColor": "blue", - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "Percent", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "opacity", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "smooth", - "lineStyle": { - "fill": "solid" - }, - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "dashed" - } - }, - "mappings": [], - "max": 40, - "min": 0, - "thresholds": { - "mode": "percentage", - "steps": [ - { - "color": "red" - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 11, - "w": 24, - "x": 0, - "y": 96 - }, - "id": 104, - "options": { - "legend": { - "calcs": [ - "lastNotNull" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true, - "sortBy": "Last *", - "sortDesc": true - }, - "tooltip": { - "mode": "multi", - "sort": "desc" - } - }, - "pluginVersion": "8.3.3", - "targets": [ + "properties": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum by (pod, container) (increase(kube_pod_container_status_restarts_total{container!=\"\"}[1h])) > 1", - "interval": "1h", - "legendFormat": "{{ pod }} / {{ container }}", - "range": true, - "refId": "A" + "id": "custom.width", + "value": 234 } - ], - "title": 
"Container Restarts", - "type": "timeseries" + ] }, { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "matcher": { + "id": "byName", + "options": "status" }, - "description": "Last 1h", - "fieldConfig": { - "defaults": { - "color": { - "fixedColor": "blue", - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "Percent", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 25, - "gradientMode": "opacity", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "smooth", - "lineStyle": { - "fill": "solid" - }, - "lineWidth": 2, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "dashed" - } - }, - "mappings": [], - "max": 50, - "min": 0, - "thresholds": { - "mode": "percentage", - "steps": [ - { - "color": "red" - } - ] - }, - "unit": "none" - }, - "overrides": [] - }, - "gridPos": { - "h": 12, - "w": 24, - "x": 0, - "y": 107 - }, - "id": 103, - "options": { - "legend": { - "calcs": [ - "lastNotNull" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true, - "sortBy": "Last *", - "sortDesc": true - }, - "tooltip": { - "mode": "multi", - "sort": "desc" - } - }, - "pluginVersion": "8.3.3", - "targets": [ + "properties": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(increase(container_oom_events_total{container!=\"\"}[1h])) by (pod, container) > 0", - "interval": "1h", - "legendFormat": "{{ pod }} / {{ container }}", - "range": true, - "refId": "A" + "id": "custom.width", + "value": 78 } - ], - "title": "OOM Events by Container", - "type": "timeseries" + ] } - ], - "title": "Pods", - "type": "row" + ] }, - 
{ - "collapsed": true, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 122 + "gridPos": { + "h": 13, + "w": 24, + "x": 0, + "y": 88 + }, + "id": 117, + "interval": "30s", + "options": { + "cellHeight": "sm", + "footer": { + "countRows": false, + "fields": "", + "reducer": [ + "sum" + ], + "show": false }, - "id": 23, - "panels": [ + "showHeader": true, + "sortBy": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "desc": true, + "displayName": "cpu limit%" + } + ] + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "kube_node_status_condition{cluster=~\"$cluster\", status=\"true\"} == 1", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "status", + "refId": "B" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum (rate (container_cpu_usage_seconds_total{cluster=~\"$cluster\", id=\"/\"}[3m])) by (node)", + "format": "table", + "hide": true, + "instant": true, + "interval": "", + "legendFormat": "node cpu used", + "refId": "I" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "kube_node_status_capacity{cluster=~\"$cluster\", resource=\"cpu\"} - 0", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "node cpu capacity", + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum(kube_pod_container_resource_requests{cluster=~\"$cluster\", resource=\"cpu\"}) by (node)", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "pod cpu request total", + "refId": "E" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + 
"exemplar": false, + "expr": "sum(kube_pod_container_resource_limits{cluster=~\"$cluster\", resource=\"cpu\"}) by (node)", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "pod cpu limit total", + "refId": "F" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum (container_memory_working_set_bytes{cluster=~\"$cluster\", id=\"/\"}) by (node)", + "format": "table", + "hide": true, + "instant": true, + "interval": "", + "legendFormat": "container mem used total", + "refId": "J" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "kube_node_status_capacity{cluster=~\"$cluster\", resource=\"memory\"} - 0", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "node mem available total", + "refId": "D" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum(kube_pod_container_resource_requests{cluster=~\"$cluster\", resource=\"memory\"}) by (node)", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "pod mem request total", + "refId": "G" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum(kube_pod_container_resource_limits{cluster=~\"$cluster\", resource=\"memory\"}) by (node)", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "pod mem limit total", + "refId": "H" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum (container_fs_usage_bytes{cluster=~\"$cluster\", device=~\"^/dev/.*$\",id=\"/\"}) by (node)", + "format": "table", + "hide": true, + "instant": true, + "interval": "", + "legendFormat": "container fs used 
total", + "refId": "K" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum (container_fs_limit_bytes{cluster=~\"$cluster\", device=~\"^/dev/.*$\",id=\"/\"}) by (node)", + "format": "table", + "hide": true, + "instant": true, + "interval": "", + "legendFormat": "container fs limit total", + "refId": "L" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum (container_memory_working_set_bytes{cluster=~\"$cluster\", id=\"/\"})by (node) / sum (machine_memory_bytes{})by (node)", + "format": "table", + "hide": true, + "instant": true, + "interval": "", + "legendFormat": "container mem used%", + "refId": "M" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum(kube_pod_container_resource_requests{cluster=~\"$cluster\", resource=\"memory\"})by (node) / sum(kube_node_status_capacity{resource=\"memory\"})by (node)", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "pod mem request %", + "refId": "N" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum(kube_pod_container_resource_limits{cluster=~\"$cluster\", resource=\"memory\"})by (node) / sum(kube_node_status_capacity{resource=\"memory\"})by (node)", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "pod mem limit %", + "refId": "O" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum (rate (container_cpu_usage_seconds_total{cluster=~\"$cluster\", id=\"/\"}[2m]))by (node) / sum (machine_cpu_cores{})by (node)", + "format": "table", + "hide": true, + "instant": true, + "interval": "", + "legendFormat": "container cpu used %", + "refId": "P" + }, + 
{ + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum(kube_pod_container_resource_requests{cluster=~\"$cluster\", resource=\"cpu\"})by (node) / sum(kube_node_status_allocatable{resource=\"cpu\"})by (node)", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "pod cpu request %", + "refId": "Q" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum(kube_pod_container_resource_limits{cluster=~\"$cluster\", resource=\"cpu\"})by (node) / sum(kube_node_status_allocatable{resource=\"cpu\"})by (node)", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "pod cpu limit %", + "refId": "R" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum (container_fs_usage_bytes{cluster=~\"$cluster\", device=~\"^/dev/.*$\",id=\"/\"})by (node) / sum (container_fs_limit_bytes{device=~\"^/dev/.*$\",id=\"/\"})by (node)", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "container fs used %", + "refId": "S" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "sum(kube_node_status_capacity{cluster=~\"$cluster\", resource=\"pods\"})by (node)", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "node pod capacity", + "refId": "T" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "count(kube_pod_info{cluster=~\"$cluster\", created_by_kind!~\"|Job\"}) by (node)", + "format": "table", + "hide": false, + "instant": true, + "interval": "", + "legendFormat": "running pod", + "refId": "A" + } + ], + "title": "Statistic for node", + "transformations": [ + { + 
"id": "seriesToColumns", + "options": { + "byField": "node" + } + }, + { + "id": "filterFieldsByName", + "options": { + "include": { + "names": [ + "node", + "condition", + "Value #B", + "Value #C", + "Value #E", + "Value #F", + "Value #D", + "Value #G", + "Value #H", + "Value #N", + "Value #O", + "Value #Q", + "Value #R", + "Value #T", + "Value #A" + ], + "pattern": "(node|condition|Value.*)" + } + } + }, + { + "id": "organize", + "options": { + "excludeByName": { + "Time 1": true, + "Time 10": true, + "Time 11": true, + "Time 12": true, + "Time 13": true, + "Time 14": true, + "Time 15": true, + "Time 16": true, + "Time 17": true, + "Time 18": true, + "Time 19": true, + "Time 2": true, + "Time 20": true, + "Time 3": true, + "Time 4": true, + "Time 5": true, + "Time 6": true, + "Time 7": true, + "Time 8": true, + "Time 9": true, + "Value #B": true, + "Value #E": false, + "Value #F": false, + "__name__": true, + "app_kubernetes_io_name 1": true, + "app_kubernetes_io_name 2": true, + "app_kubernetes_io_name 3": true, + "app_kubernetes_io_version 1": true, + "app_kubernetes_io_version 2": true, + "app_kubernetes_io_version 3": true, + "condition": false, + "instance 1": true, + "instance 2": true, + "instance 3": true, + "job 1": true, + "job 2": true, + "job 3": true, + "k8s_namespace 1": true, + "k8s_namespace 2": true, + "k8s_namespace 3": true, + "k8s_sname 1": true, + "k8s_sname 2": true, + "k8s_sname 3": true, + "origin_prometheus 1": true, + "origin_prometheus 2": true, + "origin_prometheus 3": true, + "status": true }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "custom": { - "align": "auto", - "cellOptions": { - "type": "auto" - }, - "filterable": false, - "inspect": false - }, - "mappings": [], - "noValue": "--", - "thresholds": { + "indexByName": { + "Value #A": 13, + "Value #B": 2, + "Value #C": 3, + "Value #D": 8, + "Value #E": 4, + "Value #F": 6, + "Value #G": 9, + "Value #H": 11, + "Value #N": 10, + "Value #O": 12, + 
"Value #Q": 5, + "Value #R": 7, + "Value #T": 14, + "condition": 1, + "node": 0 + }, + "renameByName": { + "Value #A": "pod", + "Value #C": "cpu total", + "Value #D": "mem total", + "Value #E": "cpu req", + "Value #F": "cpu limit", + "Value #G": "mem req", + "Value #H": "mem limit", + "Value #I": "cpu used", + "Value #J": "ram used", + "Value #K": "disk used", + "Value #L": "disk total", + "Value #M": "mem used%", + "Value #N": "mem req%", + "Value #O": "mem limit%", + "Value #P": "cpu used%", + "Value #Q": "cpu req%", + "Value #R": "cpu limit%", + "Value #S": "disk used%", + "Value #T": "pod capacity", + "condition": "status", + "node": "Node" + } + } + } + ], + "type": "table" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 0, + "gradientMode": "none", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "linear", + "lineWidth": 1, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "percent" + }, + "overrides": [ + { + "matcher": { + "id": "byRegexp", + "options": "/Total number of cores.*/" + }, + "properties": [ + { + "id": "color", + "value": { + "fixedColor": "#C4162A", + "mode": "fixed" + } + } + ] + } + ] + }, + "gridPos": { + "h": 10, + "w": 12, + "x": 0, + "y": 101 + }, + "id": 69, + "options": { + "legend": { + "calcs": [ + 
"mean", + "lastNotNull", + "max" + ], + "displayMode": "table", + "placement": "bottom", + "showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "multi", + "sort": "desc" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum (irate(container_cpu_usage_seconds_total{cluster=~\"$cluster\", container!=\"\"}[2m])) by (node) / sum(kube_node_status_allocatable{resource=\"cpu\", unit=\"core\",cluster=~\"$cluster\"})by (node)*100 ", + "format": "time_series", + "hide": false, + "instant": false, + "interval": "", + "legendFormat": "{{node}}", + "refId": "I" + } + ], + "title": "Node CPU Usage", + "type": "timeseries" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 0, + "gradientMode": "none", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "linear", + "lineWidth": 1, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "percent" + }, + "overrides": [] + }, + "gridPos": { + "h": 10, + "w": 12, + "x": 12, + "y": 101 + }, + "id": 70, + "options": { + "legend": { + "calcs": [ + "mean", + "lastNotNull", + "max" + ], + "displayMode": "table", + "placement": "bottom", + "showLegend": true + }, + "tooltip": { + 
"hideZeros": false, + "mode": "multi", + "sort": "desc" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum (container_memory_working_set_bytes{cluster=~\"$cluster\", container!=\"\"})by (node) / sum(kube_node_status_allocatable{resource=\"memory\", unit=\"byte\",cluster=~\"$cluster\"})by (node)*100", + "format": "time_series", + "hide": false, + "instant": false, + "interval": "", + "legendFormat": "{{node}}", + "refId": "I" + } + ], + "title": "Node Memory Usage", + "type": "timeseries" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "The table shows available disk size by mount points. Only mount point that used over 50% are displayed.", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "custom": { + "align": "auto", + "cellOptions": { + "type": "auto" + }, + "inspect": false + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + } + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "Size" + }, + "properties": [ + { + "id": "unit", + "value": "decbits" + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Available" + }, + "properties": [ + { + "id": "unit", + "value": "decbits" + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Used" + }, + "properties": [ + { + "id": "unit", + "value": "decbits" + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Used (%)" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "type": "gauge" + } + }, + { + "id": "thresholds", + "value": { "mode": "absolute", "steps": [ { - "color": "light-green" - } - ] - }, - "unit": "none" - }, - "overrides": [ - { - "matcher": { - "id": "byName", - "options": "Used (%)" - }, - "properties": [ - { - "id": 
"custom.cellOptions", - "value": { - "mode": "lcd", - "type": "gauge" - } + "color": "green", + "value": 0 }, { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "light-green" - }, - { - "color": "semi-dark-yellow", - "value": 70 - }, - { - "color": "dark-red", - "value": 80 - } - ] - } + "color": "red", + "value": 0.8 }, { - "id": "decimals", + "color": "#EAB839", "value": 1 } ] - }, - { - "matcher": { - "id": "byName", - "options": "Status" - }, - "properties": [ - { - "id": "custom.cellOptions", - "value": { - "mode": "gradient", - "type": "color-background" - } - }, - { - "id": "mappings", - "value": [ - { - "options": { - "0": { - "text": "Bound" - }, - "1": { - "text": "Pending" - }, - "2": { - "text": "Lost" - } - }, - "type": "value" - } - ] - }, - { - "id": "thresholds", - "value": { - "mode": "absolute", - "steps": [ - { - "color": "light-green" - }, - { - "color": "light-green", - "value": 0 - }, - { - "color": "semi-dark-orange", - "value": 1 - }, - { - "color": "semi-dark-red", - "value": 2 - } - ] - } - }, - { - "id": "noValue", - "value": "--" - }, - { - "id": "custom.align", - "value": "center" - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Namespace" - }, - "properties": [ - { - "id": "custom.width", - "value": 120 - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Status" - }, - "properties": [ - { - "id": "custom.width", - "value": 80 - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Capacity (GiB)" - }, - "properties": [ - { - "id": "custom.width", - "value": 120 - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Used (GiB)" - }, - "properties": [ - { - "id": "custom.width", - "value": 120 - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "Available (GiB)" - }, - "properties": [ - { - "id": "custom.width", - "value": 120 - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "StorageClass" - }, - "properties": [ - { - "id": 
"custom.width", - "value": 150 - } - ] - }, - { - "matcher": { - "id": "byName", - "options": "PersistentVolumeClaim" - }, - "properties": [ - { - "id": "custom.width", - "value": 370 - } - ] - } - ] - }, - "gridPos": { - "h": 8, - "w": 24, - "x": 0, - "y": 25 - }, - "id": 24, - "options": { - "cellHeight": "sm", - "footer": { - "countRows": false, - "fields": "", - "reducer": [ - "sum" - ], - "show": false - }, - "frameIndex": 2, - "showHeader": true, - "sortBy": [ - { - "desc": false, - "displayName": "PersistentVolumeClaim" - } - ] - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": " sum by (persistentvolumeclaim,namespace,storageclass,volumename) (kube_persistentvolumeclaim_info{})", - "format": "table", - "instant": true, - "interval": "", - "legendFormat": "", - "refId": "A" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum by (persistentvolumeclaim) (kubelet_volume_stats_capacity_bytes{}/1024/1024/1024)", - "format": "table", - "instant": true, - "interval": "", - "legendFormat": "", - "refId": "B" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum by (persistentvolumeclaim) (kubelet_volume_stats_used_bytes{}/1024/1024/1024)", - "format": "table", - "instant": true, - "interval": "", - "legendFormat": "", - "refId": "C" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum by (persistentvolumeclaim) (kubelet_volume_stats_available_bytes{}/1024/1024/1024)", - "format": "table", - "instant": true, - "interval": "", - "legendFormat": "", - "refId": "D" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum(kube_persistentvolumeclaim_status_phase{phase=~\"(Pending|Lost)\"}) by 
(persistentvolumeclaim) + sum(kube_persistentvolumeclaim_status_phase{phase=~\"(Lost)\"}) by (persistentvolumeclaim)", - "format": "table", - "instant": true, - "interval": "", - "legendFormat": "", - "refId": "E" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "sum by (persistentvolumeclaim) (kubelet_volume_stats_used_bytes{}/kubelet_volume_stats_capacity_bytes{} * 100)", - "format": "table", - "instant": true, - "interval": "", - "legendFormat": "", - "refId": "F" - } - ], - "title": "PVC Overview", - "transformations": [ - { - "id": "seriesToColumns", - "options": { - "byField": "persistentvolumeclaim" } }, { - "id": "organize", - "options": { - "excludeByName": { - "Time": true, - "Time 1": true, - "Time 2": true, - "Time 3": true, - "Time 4": true, - "Time 5": true, - "Time 6": true, - "Value #A": true - }, - "indexByName": {}, - "renameByName": { - "Time 1": "", - "Time 2": "", - "Time 3": "", - "Time 4": "", - "Time 5": "", - "Time 6": "", - "Value #A": "", - "Value #B": "Capacity (GiB)", - "Value #C": "Used (GiB)", - "Value #D": "Available (GiB)", - "Value #E": "Status", - "Value #F": "Used (%)", - "namespace": "Namespace", - "persistentvolumeclaim": "PersistentVolumeClaim", - "storageclass": "StorageClass", - "volumename": "PhysicalVolume" - } - } - } - ], - "type": "table" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": 
"never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "bytes" + "id": "unit", + "value": "percentunit" }, - "overrides": [] - }, - "gridPos": { - "h": 12, - "w": 24, - "x": 0, - "y": 33 - }, - "id": 68, - "options": { - "legend": { - "calcs": [ - "lastNotNull" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true - }, - "tooltip": { - "mode": "multi", - "sort": "desc" - } - }, - "pluginVersion": "10.4.3", - "targets": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "(max by (persistentvolumeclaim,namespace) (kubelet_volume_stats_used_bytes{}))", - "interval": "", - "legendFormat": "{{namespace}} ({{persistentvolumeclaim}})", - "range": true, - "refId": "A" - } - ], - "title": "All Running PVCs Used Bytes", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "WARNING: Any PVCs that are not bound to a running pod will not show up in this state.", - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 0, - "gradientMode": "none", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "linear", - "lineWidth": 1, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "links": [], - "mappings": [], - "thresholds": { - "mode": "absolute", 
- "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "bytes" + "id": "max", + "value": 1 }, - "overrides": [] - }, - "gridPos": { - "h": 11, - "w": 24, - "x": 0, - "y": 45 - }, - "id": 78, - "options": { - "legend": { - "calcs": [ - "lastNotNull" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true - }, - "tooltip": { - "mode": "multi", - "sort": "asc" - } - }, - "pluginVersion": "10.4.3", - "targets": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "expr": "rate(kubelet_volume_stats_used_bytes [1d])", - "format": "time_series", - "instant": false, - "interval": "", - "intervalFactor": 1, - "legendFormat": "{{namespace}} ({{persistentvolumeclaim}})", - "refId": "A" + "id": "min", + "value": 0 } - ], - "title": "Daily Volume Use Rate (1D)", - "type": "timeseries" + ] } - ], - "title": "Volumes", - "type": "row" + ] }, - { - "collapsed": true, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 123 + "gridPos": { + "h": 10, + "w": 24, + "x": 0, + "y": 111 + }, + "id": 46, + "options": { + "cellHeight": "sm", + "footer": { + "countRows": false, + "fields": "", + "reducer": [ + "sum" + ], + "show": false }, - "id": 1, - "panels": [ + "showHeader": true, + "sortBy": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "desc": true, + "displayName": "Used (%)" + } + ] + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(node_filesystem_free_bytes{cluster=~\"$cluster\", fstype!=\"\"}) by (instance, fstype, mountpoint)", + "format": "table", + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "max by (instance, fstype, mountpoint) (node_filesystem_size_bytes{cluster=~\"$cluster\", 
job=\"node-exporter\", fstype!=\"\", mountpoint!=\"\"})", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "B" + } + ], + "title": "Disk by Mount Point", + "transformations": [ + { + "id": "groupBy", + "options": { + "fields": { + "Value": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #A": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #B": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "fstype": { + "aggregations": [], + "operation": "groupby" + }, + "instance": { + "aggregations": [], + "operation": "groupby" + }, + "mountpoint": { + "aggregations": [], + "operation": "groupby" + } + } + } + }, + { + "id": "merge", + "options": {} + }, + { + "id": "organize", + "options": { + "excludeByName": {}, + "indexByName": { + "Value #A (lastNotNull)": 4, + "Value #B (lastNotNull)": 3, + "fstype": 0, + "instance": 1, + "mountpoint": 2 }, - "fieldConfig": { - "defaults": { - "mappings": [ + "renameByName": { + "Value #A (lastNotNull)": "Available", + "Value #B (lastNotNull)": "Size", + "fstype": "FS Type", + "instance": "Instance", + "mountpoint": "Mountpoint" + } + } + }, + { + "id": "calculateField", + "options": { + "alias": "Used", + "binary": { + "left": "Size", + "operator": "-", + "right": "Available" + }, + "mode": "binary", + "reduce": { + "reducer": "sum" + } + } + }, + { + "id": "calculateField", + "options": { + "alias": "Used (%)", + "binary": { + "left": "Used", + "operator": "/", + "right": "Size" + }, + "mode": "binary", + "reduce": { + "reducer": "sum" + } + } + } + ], + "type": "table" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 121 + }, + "id": 20, + "panels": [], + "title": "Namespaces", + "type": "row" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + 
}, + "custom": { + "align": "auto", + "cellOptions": { + "type": "auto" + }, + "filterable": false, + "inspect": false + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + } + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "Failed Pods" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + }, + { + "id": "thresholds", + "value": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 1 + } + ] + } + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Pending Pods" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + }, + { + "id": "thresholds", + "value": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "orange", + "value": 1 + } + ] + } + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Unknown Pods" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + }, + { + "id": "thresholds", + "value": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "orange", + "value": 1 + } + ] + } + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Unscheduled Pods Last 5min" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + }, + { + "id": "thresholds", + "value": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 1 + } + ] + } + } + ] + } + ] + }, + "gridPos": { + "h": 8, + "w": 24, + "x": 0, + "y": 122 + }, + "id": 49, + "options": { + "cellHeight": "sm", + "footer": { + "countRows": false, + "enablePagination": false, + "fields": "", + "reducer": [ + "sum" + ], + "show": false + }, + "showHeader": true + }, + 
"pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_pod_owner{cluster=~\"$cluster\", job=\"kube-state-metrics\"}) by (namespace)", + "format": "table", + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "count(avg(namespace_workload_pod:kube_pod_owner:relabel{cluster=~\"$cluster\", }) by (workload, namespace)) by (namespace)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "B" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_pod_status_phase{cluster=~\"$cluster\", phase=\"Failed\"}) by (namespace)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_pod_status_phase{cluster=~\"$cluster\", phase=\"Unknown\"}) by (namespace)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "E" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(avg_over_time(kube_pod_status_scheduled{cluster=~\"$cluster\", condition=\"false\"}[5m])) by (namespace)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "F" + } + ], + "title": "Pods Status", + "transformations": [ + { + "id": "groupBy", + "options": { + "fields": { + "Value": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #A": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #B": { + "aggregations": [ + "lastNotNull" + ], + 
"operation": "aggregate" + }, + "Value #C": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #D": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #E": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #F": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "namespace": { + "aggregations": [], + "operation": "groupby" + } + } + } + }, + { + "id": "merge", + "options": {} + }, + { + "id": "organize", + "options": { + "excludeByName": {}, + "indexByName": {}, + "renameByName": { + "Value #A (lastNotNull)": "Pods", + "Value #B (lastNotNull)": "Workloads", + "Value #C (lastNotNull)": "Failed Pods", + "Value #D (lastNotNull)": "Pending Pods", + "Value #E (lastNotNull)": "Unknown Pods", + "Value #F (lastNotNull)": "Unscheduled Pods Last 5min", + "namespace": "Namespace" + } + } + } + ], + "type": "table" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "custom": { + "align": "auto", + "cellOptions": { + "type": "auto" + }, + "inspect": false + }, + "decimals": 2, + "displayName": "", + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "short" + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "CPU Requests (%)" + }, + "properties": [ + { + "id": "custom.align" + }, + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + }, + { + "id": "unit", + "value": "percentunit" + }, + { + "id": "thresholds", + "value": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "orange", + "value": 0.8 + }, + { + "color": "red", + "value": 1 + } + ] + } + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "CPU Limits (%)" + }, + "properties": [ + 
{ + "id": "unit", + "value": "percentunit" + }, + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + }, + { + "id": "thresholds", + "value": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "orange", + "value": 0.6 + }, + { + "color": "red", + "value": 0.8 + } + ] + } + } + ] + } + ] + }, + "gridPos": { + "h": 9, + "w": 24, + "x": 0, + "y": 130 + }, + "id": 63, + "interval": "1m", + "options": { + "cellHeight": "sm", + "footer": { + "countRows": false, + "fields": "", + "reducer": [ + "sum" + ], + "show": false + }, + "showHeader": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=~\"$cluster\", }) by (namespace)", + "format": "table", + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(namespace_cpu:kube_pod_container_resource_requests:sum{cluster=~\"$cluster\", }) by (namespace)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "B" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=~\"$cluster\", }) by (namespace) / sum(namespace_cpu:kube_pod_container_resource_requests:sum{}) by (namespace)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(namespace_cpu:kube_pod_container_resource_limits:sum{cluster=~\"$cluster\", }) by (namespace)", + "format": "table", + "hide": false, + 
"instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "D" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=~\"$cluster\", }) by (namespace) / sum(namespace_cpu:kube_pod_container_resource_limits:sum{}) by (namespace)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "E" + } + ], + "title": "CPU Information", + "transformations": [ + { + "id": "groupBy", + "options": { + "fields": { + "Value": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #A": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #B": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #C": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #D": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #E": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "namespace": { + "aggregations": [], + "operation": "groupby" + } + } + } + }, + { + "id": "merge", + "options": {} + }, + { + "id": "organize", + "options": { + "excludeByName": {}, + "indexByName": {}, + "renameByName": { + "Value #A (lastNotNull)": "CPU Usage (vCPU)", + "Value #B (lastNotNull)": "CPU Requests (vCPU)", + "Value #C (lastNotNull)": "CPU Requests (%)", + "Value #D (lastNotNull)": "CPU Limits (vCPU)", + "Value #E (lastNotNull)": "CPU Limits (%)", + "namespace": "Namespace" + } + } + } + ], + "type": "table" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "custom": { + "align": "auto", + "cellOptions": { + "type": "auto" + }, + "inspect": false + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + 
"color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "bytes" + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "Memory Requests (%)" + }, + "properties": [ + { + "id": "unit", + "value": "percentunit" + }, + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + }, + { + "id": "thresholds", + "value": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "orange", + "value": 0.8 + }, + { + "color": "red", + "value": 1 + } + ] + } + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Memory Limits (%)" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "type": "color-background" + } + }, + { + "id": "unit", + "value": "percentunit" + }, + { + "id": "thresholds", + "value": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "orange", + "value": 0.6 + }, + { + "color": "red", + "value": 0.8 + } + ] + } + } + ] + } + ] + }, + "gridPos": { + "h": 8, + "w": 24, + "x": 0, + "y": 139 + }, + "id": 64, + "options": { + "cellHeight": "sm", + "footer": { + "countRows": false, + "fields": "", + "reducer": [ + "sum" + ], + "show": false + }, + "showHeader": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(container_memory_rss{cluster=~\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics/cadvisor\", container!=\"\"}) by (namespace)", + "format": "table", + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(namespace_memory:kube_pod_container_resource_requests:sum{cluster=~\"$cluster\", }) by (namespace)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "B" + }, + { + 
"datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(container_memory_rss{cluster=~\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics/cadvisor\", container!=\"\"}) by (namespace) / sum(namespace_memory:kube_pod_container_resource_requests:sum{}) by (namespace)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(namespace_memory:kube_pod_container_resource_limits:sum{cluster=~\"$cluster\", }) by (namespace)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "D" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(container_memory_rss{cluster=~\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics/cadvisor\", container!=\"\"}) by (namespace) / sum(namespace_memory:kube_pod_container_resource_limits:sum{}) by (namespace)", + "format": "table", + "hide": false, + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "E" + } + ], + "title": "Memory Information", + "transformations": [ + { + "id": "groupBy", + "options": { + "fields": { + "Value #A": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #B": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #C": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #D": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "Value #E": { + "aggregations": [ + "lastNotNull" + ], + "operation": "aggregate" + }, + "namespace": { + "aggregations": [ + "lastNotNull" + ], + "operation": "groupby" + } + } + } + }, + { + "id": "merge", + "options": {} + }, + { + "id": "organize", + "options": { + "excludeByName": {}, + "indexByName": {}, + 
"renameByName": { + "Value #A (lastNotNull)": "Memory Usage ", + "Value #B (lastNotNull)": "Memory Requests ", + "Value #C (lastNotNull)": "Memory Requests (%)", + "Value #D (lastNotNull)": "Memory Limits", + "Value #E (lastNotNull)": "Memory Limits (%)", + "namespace": "Namespace" + } + } + } + ], + "type": "table" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 147 + }, + "id": 25, + "panels": [], + "title": "Workloads", + "type": "row" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "custom": { + "align": "auto", + "cellOptions": { + "type": "auto" + }, + "inspect": false + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + } + }, + "overrides": [] + }, + "gridPos": { + "h": 10, + "w": 24, + "x": 0, + "y": 148 + }, + "id": 94, + "interval": "1m", + "options": { + "cellHeight": "sm", + "footer": { + "countRows": false, + "fields": "", + "reducer": [ + "sum" + ], + "show": false + }, + "showHeader": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "count(namespace_workload_pod:kube_pod_owner:relabel{cluster=~\"$cluster\"}) by (workload, workload_type, namespace)", + "format": "table", + "instant": true, + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 10 + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=~\"$cluster\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=~\"$cluster\"}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true, + "intervalFactor": 2, + "legendFormat": "", + "refId": "B", + "step": 
10 + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(\n kube_pod_container_resource_requests{job=\"kube-state-metrics\", resource=\"cpu\", cluster=~\"$cluster\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true, + "intervalFactor": 2, + "legendFormat": "", + "refId": "C", + "step": 10 + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type, namespace)\n/sum(\n kube_pod_container_resource_requests{job=\"kube-state-metrics\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type, namespace)\n", + "format": "table", + "instant": true, + "intervalFactor": 2, + "legendFormat": "", + "refId": "D", + "step": 10 + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(\n kube_pod_container_resource_limits{job=\"kube-state-metrics\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true, + "intervalFactor": 2, + "legendFormat": "", + "refId": "E", + "step": 10 + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n/sum(\n 
kube_pod_container_resource_limits{job=\"kube-state-metrics\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true, + "intervalFactor": 2, + "legendFormat": "", + "refId": "F", + "step": 10 + } + ], + "title": "CPU Information", + "type": "table" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "custom": { + "align": "auto", + "cellOptions": { + "type": "auto" + }, + "inspect": false + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + } + }, + "overrides": [] + }, + "gridPos": { + "h": 11, + "w": 24, + "x": 0, + "y": 158 + }, + "id": 48, + "interval": "1m", + "options": { + "cellHeight": "sm", + "footer": { + "countRows": false, + "fields": "", + "reducer": [ + "sum" + ], + "show": false + }, + "showHeader": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "count(namespace_workload_pod:kube_pod_owner:relabel{cluster=~\"$cluster\"}) by (workload, workload_type, namespace)", + "format": "table", + "instant": true, + "intervalFactor": 2, + "legendFormat": "", + "refId": "A", + "step": 10 + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(\n container_memory_working_set_bytes{job=\"kubelet\", container!=\"\", image!=\"\",cluster=~\"$cluster\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true, + "intervalFactor": 2, + "legendFormat": "", + "refId": "B", + "step": 10 + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": 
"code", + "expr": "sum(\n kube_pod_container_resource_requests{job=\"kube-state-metrics\", resource=\"memory\",cluster=~\"$cluster\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=~\"$cluster\"}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true, + "intervalFactor": 2, + "legendFormat": "", + "refId": "C", + "step": 10 + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(\n container_memory_working_set_bytes{job=\"kubelet\", container!=\"\", image!=\"\",cluster=~\"$cluster\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n/sum(\n kube_pod_container_resource_requests{job=\"kube-state-metrics\", resource=\"memory\",cluster=~\"$cluster\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true, + "intervalFactor": 2, + "legendFormat": "", + "refId": "D", + "step": 10 + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(\n kube_pod_container_resource_limits{job=\"kube-state-metrics\", resource=\"memory\",cluster=~\"$cluster\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true, + "intervalFactor": 2, + "legendFormat": "", + "refId": "E", + "step": 10 + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(\n container_memory_working_set_bytes{job=\"kubelet\", container!=\"\", image!=\"\",cluster=~\"$cluster\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n/sum(\n 
kube_pod_container_resource_limits{job=\"kube-state-metrics\", resource=\"memory\",cluster=~\"$cluster\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true, + "intervalFactor": 2, + "legendFormat": "", + "refId": "F", + "step": 10 + } + ], + "title": "Memory Information", + "type": "table" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 169 + }, + "id": 72, + "panels": [], + "title": "Jobs", + "type": "row" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "fixedColor": "rgb(31, 120, 193)", + "mode": "fixed" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "text": "N/A" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 3, + "w": 8, + "x": 0, + "y": 170 + }, + "id": 73, + "maxDataPoints": 100, + "options": { + "colorMode": "none", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_job_status_succeeded{cluster=~\"$cluster\"})", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "Jobs Succeeded", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "", + "fieldConfig": { + "defaults": { + "color": { + "mode": 
"thresholds" + }, + "custom": { + "align": "auto", + "cellOptions": { + "type": "auto" + }, + "inspect": false + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + } + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "Time" + }, + "properties": [ + { + "id": "displayName", + "value": "Time" + }, + { + "id": "unit", + "value": "time: YYYY-MM-DD HH:mm:ss" + }, + { + "id": "custom.align" + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Metric" + }, + "properties": [ + { + "id": "displayName", + "value": "Job" + }, + { + "id": "unit", + "value": "short" + }, + { + "id": "decimals", + "value": 2 + }, + { + "id": "custom.align" + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Value" + }, + "properties": [ + { + "id": "displayName", + "value": "Day" + }, + { + "id": "unit", + "value": "none" + }, + { + "id": "decimals", + "value": 4 + }, + { + "id": "custom.align" + } + ] + } + ] + }, + "gridPos": { + "h": 9, + "w": 8, + "x": 8, + "y": 170 + }, + "id": 76, + "options": { + "cellHeight": "sm", + "footer": { + "countRows": false, + "fields": "", + "reducer": [ + "sum" + ], + "show": false + }, + "showHeader": true, + "sortBy": [ + { + "desc": false, + "displayName": "Day" + } + ] + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "(time()-kube_job_status_completion_time{cluster=~\"$cluster\"})/60/60/24>1", + "format": "time_series", + "instant": true, + "interval": "", + "intervalFactor": 1, + "legendFormat": "{{job_name}}", + "refId": "A" + } + ], + "title": "Last Succeeded Jobs", + "transformations": [ + { + "id": "seriesToRows", + "options": { + "reducers": [] + } + } + ], + "type": "table" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "", + "fieldConfig": { + 
"defaults": { + "color": { + "mode": "thresholds" + }, + "custom": { + "align": "auto", + "cellOptions": { + "type": "auto" + }, + "inspect": false + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + } + }, + "overrides": [] + }, + "gridPos": { + "h": 9, + "w": 8, + "x": 16, + "y": 170 + }, + "id": 77, + "options": { + "cellHeight": "sm", + "footer": { + "countRows": false, + "fields": "", + "reducer": [ + "sum" + ], + "show": false + }, + "showHeader": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "kube_job_status_failed{cluster=~\"$cluster\"}>=1", + "format": "time_series", + "instant": true, + "interval": "", + "intervalFactor": 1, + "legendFormat": "{{job_name}}", + "refId": "A" + } + ], + "title": "Failed Jobs", + "transformations": [ + { + "id": "labelsToFields", + "options": { + "keepLabels": [ + "job_name", + "namespace", + "reason" + ] + } + } + ], + "type": "table" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "fixedColor": "rgb(31, 120, 193)", + "mode": "fixed" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "text": "N/A" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 3, + "w": 8, + "x": 0, + "y": 173 + }, + "id": 74, + "maxDataPoints": 100, + "options": { + "colorMode": "none", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "textMode": 
"auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_job_status_active{})", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "Jobs Active", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "fixedColor": "rgb(31, 120, 193)", + "mode": "fixed" + }, + "mappings": [ + { + "options": { + "match": "null", + "result": { + "text": "N/A" + } + }, + "type": "special" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 3, + "w": 8, + "x": 0, + "y": 176 + }, + "id": 75, + "maxDataPoints": 100, + "options": { + "colorMode": "none", + "graphMode": "area", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_job_status_failed{})", + "format": "time_series", + "intervalFactor": 1, + "range": true, + "refId": "A" + } + ], + "title": "Jobs Failed", + "type": "stat" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 179 + }, + "id": 54, + "panels": [], + "title": "Pods", + "type": "row" + }, + { + "fieldConfig": { + "defaults": {}, + "overrides": [] + }, + "gridPos": { + "h": 2, + "w": 24, + "x": 0, + "y": 180 + }, + "id": 123, + "options": { + "code": { + "language": "plaintext", + "showLineNumbers": false, + "showMiniMap": false + }, + 
"content": "
\n

CPU Information

\n
\n", + "mode": "html" + }, + "pluginVersion": "12.1.0", + "title": "", + "type": "text" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "fixedColor": "orange", + "mode": "continuous-GrYlRd" + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + } + ] + } + }, + "overrides": [] + }, + "gridPos": { + "h": 9, + "w": 24, + "x": 0, + "y": 182 + }, + "id": 120, + "options": { + "displayMode": "gradient", + "legend": { + "calcs": [], + "displayMode": "list", + "placement": "bottom", + "showLegend": false + }, + "maxVizHeight": 300, + "minVizHeight": 16, + "minVizWidth": 8, + "namePlacement": "auto", + "orientation": "horizontal", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showUnfilled": true, + "sizing": "auto", + "valueMode": "color" + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "952b8fca-4117-4324-92cc-fba33c458982" + }, + "editorMode": "code", + "exemplar": false, + "expr": "topk(10, sum(rate(container_cpu_usage_seconds_total{container!=\"\"}[5m])) by (pod))", + "instant": true, + "legendFormat": "{{pod}}", + "range": false, + "refId": "A" + } + ], + "title": "Top 10 CPU Consuming Pods", + "type": "bargauge" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 0, + "gradientMode": "none", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "linear", + "lineWidth": 1, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + 
"showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "links": [], + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "percent" + }, + "overrides": [] + }, + "gridPos": { + "h": 12, + "w": 24, + "x": 0, + "y": 191 + }, + "id": 93, + "options": { + "legend": { + "calcs": [ + "mean", + "lastNotNull", + "max" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "multi", + "sort": "desc" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "max(irate(container_cpu_usage_seconds_total{container !=\"\",container!=\"POD\",cluster=~\"$cluster\"}[2m])) by (container, pod, namespace) / (max(container_spec_cpu_quota{container !=\"\",container!=\"POD\",cluster=~\"$cluster\"}/100000) by (container, pod, namespace)) * 100", + "hide": false, + "instant": false, + "interval": "", + "intervalFactor": 1, + "legendFormat": "{{ namespace }} / {{ pod }}", + "metric": "container_cpu", + "refId": "A", + "step": 10 + } + ], + "title": "Pod Containers CPU Utilization", + "type": "timeseries" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "How much additional CPU the container would have needed to avoid CPU throttling", + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 0, + "gradientMode": "none", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": 
false, + "lineInterpolation": "linear", + "lineWidth": 1, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "auto", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + } + }, + "overrides": [] + }, + "gridPos": { + "h": 13, + "w": 12, + "x": 0, + "y": 203 + }, + "id": 121, + "options": { + "legend": { + "calcs": [ + "lastNotNull", + "mean", + "max" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "single", + "sort": "none" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "952b8fca-4117-4324-92cc-fba33c458982" + }, + "editorMode": "code", + "expr": "sum(rate(container_cpu_cfs_throttled_seconds_total{cluster=~\"$cluster\"}[5m])) by (namespace,pod) > 0", + "instant": false, + "legendFormat": "{{namespace}} / {{pod}}", + "range": true, + "refId": "A" + } + ], + "title": "CPU Throttling Seconds", + "type": "timeseries" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "cpu cores", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 40, + "gradientMode": "none", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "linear", + "lineWidth": 6, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + 
"mode": "off" + } + }, + "links": [], + "mappings": [], + "max": 100, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "short" + }, + "overrides": [ + { + "matcher": { + "id": "byRegexp", + "options": "/Throttle/" + }, + "properties": [ + { + "id": "unit", + "value": "percent" + }, + { + "id": "custom.axisLabel", + "value": "throttling percent" + } + ] + } + ] + }, + "gridPos": { + "h": 13, + "w": 12, + "x": 12, + "y": 203 + }, + "id": 119, + "options": { + "legend": { + "calcs": [ + "lastNotNull", + "mean", + "max" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "multi", + "sort": "none" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "rate(container_cpu_usage_seconds_total{cluster=~\"$cluster\"}[1m])", + "legendFormat": "CPU Cores Usage {{namespace}}/{{pod}}/{{container}}", + "range": true, + "refId": "B" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum by (namespace,pod,container) ((container_cpu_cfs_throttled_periods_total{cluster=~\"$cluster\"} / container_cpu_cfs_periods_total{cluster=~\"$cluster\"}) * 100)", + "legendFormat": "Throttle Percent {{namespace}}/{{pod}}/{{container}}", + "range": true, + "refId": "A" + } + ], + "title": "CPU Usage vs Throttling Percent", + "type": "timeseries" + }, + { + "fieldConfig": { + "defaults": {}, + "overrides": [] + }, + "gridPos": { + "h": 2, + "w": 24, + "x": 0, + "y": 216 + }, + "id": 124, + "options": { + "code": { + "language": "plaintext", + "showLineNumbers": false, + "showMiniMap": false + }, + "content": "
\n

Memory Information

\n
\n", + "mode": "html" + }, + "pluginVersion": "12.1.0", + "title": "", + "type": "text" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "continuous-GrYlRd" + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + } + ] + }, + "unit": "bytes" + }, + "overrides": [] + }, + "gridPos": { + "h": 10, + "w": 24, + "x": 0, + "y": 218 + }, + "id": 126, + "options": { + "displayMode": "gradient", + "legend": { + "calcs": [], + "displayMode": "list", + "placement": "bottom", + "showLegend": false + }, + "maxVizHeight": 300, + "minVizHeight": 16, + "minVizWidth": 8, + "namePlacement": "auto", + "orientation": "horizontal", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showUnfilled": true, + "sizing": "auto", + "valueMode": "color" + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "952b8fca-4117-4324-92cc-fba33c458982" + }, + "editorMode": "code", + "exemplar": false, + "expr": "topk(10,sum(container_memory_working_set_bytes{container!=\"\",cluster=~\"$cluster\"}) by (pod))", + "instant": true, + "legendFormat": "__auto", + "range": false, + "refId": "A" + } + ], + "title": "Top 10 Memory Consuming Pods", + "type": "bargauge" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Pods whose Mem usage/Mem limits is more than 65%.", + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 0, + "gradientMode": "none", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "linear", + 
"lineWidth": 1, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "auto", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "dashed" + } + }, + "mappings": [], + "max": 1, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "orange", + "value": 0.7 + }, + { + "color": "red", + "value": 0.8 + } + ] + }, + "unit": "percentunit" + }, + "overrides": [] + }, + "gridPos": { + "h": 11, + "w": 24, + "x": 0, + "y": 228 + }, + "id": 122, + "options": { + "legend": { + "calcs": [ + "lastNotNull", + "mean", + "max" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "single", + "sort": "none" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "952b8fca-4117-4324-92cc-fba33c458982" + }, + "editorMode": "code", + "expr": "sum(container_memory_working_set_bytes{container!=\"\", cluster=~\"$cluster\"}) by (namespace,pod) /\r\nsum(kube_pod_container_resource_limits{resource=\"memory\", cluster=~\"$cluster\"}) by (namespace,pod) > 0.65", + "instant": false, + "legendFormat": "{{ namespace }} / {{ pod }}", + "range": true, + "refId": "A" + } + ], + "title": "Pods with Potential Mem Leaks", + "type": "timeseries" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 0, + "gradientMode": "none", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "linear", + "lineWidth": 1, + "pointSize": 5, + 
"scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "links": [], + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "percent" + }, + "overrides": [] + }, + "gridPos": { + "h": 11, + "w": 24, + "x": 0, + "y": 239 + }, + "id": 95, + "options": { + "legend": { + "calcs": [ + "max", + "last", + "mean" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "multi", + "sort": "desc" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "max (container_memory_working_set_bytes{container !=\"\",container!=\"POD\",cluster=~\"$cluster\"}) by (namespace,container, pod)/ max(container_spec_memory_limit_bytes{container !=\"\",container!=\"POD\",cluster=~\"$cluster\"}) by (namespace,container, pod) * 100", + "interval": "", + "intervalFactor": 1, + "legendFormat": "WSS:{{ namespace }} / {{ pod }}", + "metric": "container_memory_usage:sort_desc", + "range": true, + "refId": "A", + "step": 10 + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": false, + "expr": "max (container_memory_rss{container !=\"\",container!=\"POD\",cluster=~\"$cluster\"}) by (namespace,container, pod)/ max(container_spec_memory_limit_bytes{container !=\"\",container!=\"POD\",cluster=~\"$cluster\"}) by (namespace,container, pod) * 100", + "interval": "", + "intervalFactor": 1, + "legendFormat": "RSS:{{ namespace }} / {{ pod }}", + "metric": "container_memory_usage:sort_desc", + "range": true, + "refId": "B", + "step": 10 + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + 
"editorMode": "code", + "exemplar": true, + "expr": "(cass_jvm_heap{} * on (namespace,pod_ip) group_right(service) kube_pod_info{cluster=~\"$cluster\"}) / (cass_jvm_heap_max{cluster=~\"$cluster\"} * on (namespace,pod_ip) group_right(service) kube_pod_info{cluster=~\"$cluster\"}) * 100", + "hide": true, + "instant": false, + "interval": "", + "intervalFactor": 1, + "legendFormat": "Heap:{{ namespace }} / {{ pod }}", + "metric": "container_memory_usage:sort_desc", + "refId": "C", + "step": 10 + } + ], + "title": "Pod Container Memory Usage", + "type": "timeseries" + }, + { + "fieldConfig": { + "defaults": {}, + "overrides": [] + }, + "gridPos": { + "h": 2, + "w": 24, + "x": 0, + "y": 250 + }, + "id": 125, + "options": { + "code": { + "language": "plaintext", + "showLineNumbers": false, + "showMiniMap": false + }, + "content": "
\n

Events

\n
\n", + "mode": "html" + }, + "pluginVersion": "12.1.0", + "title": "", + "type": "text" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Last 1h", + "fieldConfig": { + "defaults": { + "color": { + "fixedColor": "blue", + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "Percent", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 0, + "gradientMode": "opacity", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "smooth", + "lineStyle": { + "fill": "solid" + }, + "lineWidth": 1, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "dashed" + } + }, + "mappings": [], + "max": 40, + "min": 0, + "thresholds": { + "mode": "percentage", + "steps": [ + { + "color": "red", + "value": 0 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 11, + "w": 24, + "x": 0, + "y": 252 + }, + "id": 104, + "options": { + "legend": { + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true, + "sortBy": "Last *", + "sortDesc": true + }, + "tooltip": { + "hideZeros": false, + "mode": "multi", + "sort": "desc" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum by (pod, container) (increase(kube_pod_container_status_restarts_total{container!=\"\",cluster=~\"$cluster\"}[1h])) > 1", + "interval": "1h", + "legendFormat": "{{ pod }} / {{ container }}", + "range": true, + "refId": "A" + } + ], + "title": "Container Restarts", + "type": "timeseries" + }, + { + "datasource": { + "type": 
"prometheus", + "uid": "Mimir" + }, + "description": "Last 1h", + "fieldConfig": { + "defaults": { + "color": { + "fixedColor": "blue", + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "Percent", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 25, + "gradientMode": "opacity", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "smooth", + "lineStyle": { + "fill": "solid" + }, + "lineWidth": 2, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "dashed" + } + }, + "mappings": [], + "max": 50, + "min": 0, + "thresholds": { + "mode": "percentage", + "steps": [ + { + "color": "red", + "value": 0 + } + ] + }, + "unit": "none" + }, + "overrides": [] + }, + "gridPos": { + "h": 12, + "w": 24, + "x": 0, + "y": 263 + }, + "id": 103, + "options": { + "legend": { + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true, + "sortBy": "Last *", + "sortDesc": true + }, + "tooltip": { + "hideZeros": false, + "mode": "multi", + "sort": "desc" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(increase(container_oom_events_total{container!=\"\",cluster=~\"$cluster\"}[1h])) by (pod, container) > 0", + "interval": "1h", + "legendFormat": "{{ pod }} / {{ container }}", + "range": true, + "refId": "A" + } + ], + "title": "OOM Events by Container", + "type": "timeseries" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 275 + }, + "id": 23, + "panels": [], + "title": "Volumes", + "type": "row" + }, + { + 
"datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "custom": { + "align": "auto", + "cellOptions": { + "type": "auto" + }, + "filterable": false, + "inspect": false + }, + "mappings": [], + "noValue": "--", + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "light-green", + "value": 0 + } + ] + }, + "unit": "none" + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "Used (%)" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "mode": "lcd", + "type": "gauge" + } + }, + { + "id": "thresholds", + "value": { + "mode": "absolute", + "steps": [ + { + "color": "light-green", + "value": 0 + }, + { + "color": "semi-dark-yellow", + "value": 70 + }, + { + "color": "dark-red", + "value": 80 + } + ] + } + }, + { + "id": "decimals", + "value": 1 + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Status" + }, + "properties": [ + { + "id": "custom.cellOptions", + "value": { + "mode": "gradient", + "type": "color-background" + } + }, + { + "id": "mappings", + "value": [ { "options": { "0": { - "text": "DOWN" + "text": "Bound" }, "1": { - "text": "UP" + "text": "Pending" + }, + "2": { + "text": "Lost" } }, "type": "value" } - ], - "thresholds": { + ] + }, + { + "id": "thresholds", + "value": { "mode": "absolute", "steps": [ { - "color": "red" + "color": "light-green", + "value": 0 }, { - "color": "green", + "color": "light-green", + "value": 0 + }, + { + "color": "semi-dark-orange", "value": 1 + }, + { + "color": "semi-dark-red", + "value": 2 } ] } }, - "overrides": [] - }, - "gridPos": { - "h": 8, - "w": 12, - "x": 0, - "y": 10 - }, - "id": 2, - "options": { - "colorMode": "background", - "graphMode": "none", - "justifyMode": "auto", - "orientation": "horizontal", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "textMode": "value_and_name", - 
"wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "up{job=\"apiserver\"}", - "interval": "", - "legendFormat": "{{instance}}", - "range": true, - "refId": "A" + "id": "noValue", + "value": "--" + }, + { + "id": "custom.align", + "value": "center" } - ], - "title": "Health Status", - "type": "stat" + ] }, { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "matcher": { + "id": "byName", + "options": "Namespace" }, - "description": "Last 5Min", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - "mappings": [], - "max": 1, - "min": 0, - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "text" - } - ] - }, - "unit": "percentunit" - }, - "overrides": [] - }, - "gridPos": { - "h": 8, - "w": 6, - "x": 12, - "y": 10 - }, - "id": 128, - "options": { - "colorMode": "value", - "graphMode": "none", - "justifyMode": "auto", - "orientation": "auto", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ + "properties": [ { - "datasource": { - "type": "prometheus", - "uid": "952b8fca-4117-4324-92cc-fba33c458982" - }, - "editorMode": "code", - "expr": "sum(irate(apiserver_request_total{code=~\"20.*\",verb=~\"GET|LIST\"}[5m]))/sum(irate(apiserver_request_total{verb=~\"GET|LIST\"}[5m]))", - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A" + "id": "custom.width", + "value": 120 } - ], - "title": "API Server - Read Success Rate", - "type": "stat" + ] }, { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "matcher": { + "id": "byName", + "options": "Status" }, - "description": "Last 5Min", - "fieldConfig": { - "defaults": { - "color": { - "mode": "thresholds" - }, - 
"mappings": [], - "max": 1, - "min": 0, - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "text" - } - ] - }, - "unit": "percentunit" - }, - "overrides": [] - }, - "gridPos": { - "h": 8, - "w": 6, - "x": 18, - "y": 10 - }, - "id": 129, - "options": { - "colorMode": "value", - "graphMode": "none", - "justifyMode": "auto", - "orientation": "auto", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showPercentChange": false, - "textMode": "auto", - "wideLayout": true - }, - "pluginVersion": "10.4.3", - "targets": [ + "properties": [ { - "datasource": { - "type": "prometheus", - "uid": "952b8fca-4117-4324-92cc-fba33c458982" - }, - "editorMode": "code", - "expr": "sum(irate(apiserver_request_total{code=~\"20.*\",verb!~\"GET|LIST|WATCH|CONNECT\"}[5m]))/sum(irate(apiserver_request_total{verb!~\"GET|LIST|WATCH|CONNECT\"}[5m]))", - "instant": false, - "legendFormat": "__auto", - "range": true, - "refId": "A" + "id": "custom.width", + "value": 80 } - ], - "title": "API Server - Write Success Rate", - "type": "stat" + ] }, { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "matcher": { + "id": "byName", + "options": "Capacity (GiB)" }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 25, - "gradientMode": "opacity", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "smooth", - "lineWidth": 2, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "decimals": 2, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ 
- { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "s" - }, - "overrides": [] - }, - "gridPos": { - "h": 9, - "w": 12, - "x": 0, - "y": 18 - }, - "id": 100, - "options": { - "legend": { - "calcs": [ - "lastNotNull", - "mean", - "max" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true - }, - "tooltip": { - "mode": "single", - "sort": "none" - } - }, - "pluginVersion": "8.3.3", - "targets": [ + "properties": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "rate(process_cpu_seconds_total{job=~\"kubernetes-apiservers|apiserver\"}[1m])", - "interval": "", - "legendFormat": "{{ instance }}", - "range": true, - "refId": "A" + "id": "custom.width", + "value": 120 } - ], - "title": "API Server - CPU Usage in CPU Seconds", - "type": "timeseries" + ] }, { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "matcher": { + "id": "byName", + "options": "Used (GiB)" }, - "fieldConfig": { - "defaults": { - "custom": { - "align": "auto", - "cellOptions": { - "type": "auto" - }, - "inspect": false - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - } - }, - "overrides": [ - { - "matcher": { - "id": "byName", - "options": "_name_" - }, - "properties": [ - { - "id": "custom.width", - "value": 188 - } - ] - } - ] - }, - "gridPos": { - "h": 9, - "w": 12, - "x": 12, - "y": 18 - }, - "id": 5, - "options": { - "cellHeight": "sm", - "footer": { - "countRows": false, - "fields": "", - "reducer": [ - "sum" - ], - "show": false - }, - "showHeader": true, - "sortBy": [ - { - "desc": false, - "displayName": "removed_release" - } - ] - }, - "pluginVersion": "10.4.3", - "targets": [ + "properties": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": 
"apiserver_requested_deprecated_apis", - "interval": "", - "legendFormat": "__auto", - "range": true, - "refId": "A" + "id": "custom.width", + "value": 120 } - ], - "title": "Deprecated Kubernetes Resources", - "transformations": [ - { - "id": "labelsToFields", - "options": { - "keepLabels": [ - "group", - "job", - "removed_release", - "resource", - "version", - "name" - ], - "mode": "columns" - } - }, - { - "id": "merge", - "options": {} - }, - { - "id": "organize", - "options": { - "excludeByName": { - "Time": true, - "Value": true, - "job": true - }, - "indexByName": { - "Time": 6, - "Value": 7, - "group": 1, - "job": 5, - "namespace": 0, - "removed_release": 4, - "resource": 3, - "version": 2 - }, - "renameByName": {} - } - }, - { - "id": "groupBy", - "options": { - "fields": { - "group": { - "aggregations": [ - "lastNotNull" - ], - "operation": "groupby" - }, - "job": { - "aggregations": [], - "operation": "groupby" - }, - "namespace": { - "aggregations": [ - "lastNotNull" - ], - "operation": "groupby" - }, - "removed_release": { - "aggregations": [], - "operation": "groupby" - }, - "resource": { - "aggregations": [ - "lastNotNull" - ], - "operation": "groupby" - }, - "version": { - "aggregations": [], - "operation": "groupby" - } - } - } - } - ], - "type": "table" + ] }, { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "matcher": { + "id": "byName", + "options": "Available (GiB)" }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 25, - "gradientMode": "opacity", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "smooth", - "lineWidth": 2, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - 
"spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "ms" - }, - "overrides": [] - }, - "gridPos": { - "h": 9, - "w": 12, - "x": 0, - "y": 27 - }, - "id": 96, - "options": { - "legend": { - "calcs": [ - "lastNotNull", - "mean", - "max" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true - }, - "tooltip": { - "mode": "single", - "sort": "none" - } - }, - "pluginVersion": "8.3.3", - "targets": [ + "properties": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(rate(apiserver_request_duration_seconds_sum{job=~\"kubernetes-apiservers|apiserver\"}[1m])) by (instance)\n/\nsum(rate(apiserver_request_duration_seconds_count{job=~\"kubernetes-apiservers|apiserver\"}[1m])) by (instance)", - "interval": "", - "legendFormat": "{{ instance }}", - "range": true, - "refId": "A" + "id": "custom.width", + "value": 120 } - ], - "title": "API Server - HTTP Requests Latency by instance", - "type": "timeseries" + ] }, { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "matcher": { + "id": "byName", + "options": "StorageClass" }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 25, - "gradientMode": "opacity", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "smooth", - "lineWidth": 2, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - 
"mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "bytes" - }, - "overrides": [] - }, - "gridPos": { - "h": 9, - "w": 12, - "x": 12, - "y": 27 - }, - "id": 101, - "options": { - "legend": { - "calcs": [ - "lastNotNull", - "mean", - "max" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true - }, - "tooltip": { - "mode": "single", - "sort": "none" - } - }, - "pluginVersion": "8.3.3", - "targets": [ + "properties": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "process_resident_memory_bytes{job=~\"kubernetes-apiservers|apiserver\"}", - "interval": "", - "legendFormat": "{{ instance }}", - "range": true, - "refId": "A" + "id": "custom.width", + "value": 150 } - ], - "title": "API Server - Memory Usage by instance", - "type": "timeseries" + ] }, { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" + "matcher": { + "id": "byName", + "options": "PersistentVolumeClaim" }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 25, - "gradientMode": "opacity", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "smooth", - "lineWidth": 2, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } 
- ] - }, - "unit": "short" - }, - "overrides": [] - }, - "gridPos": { - "h": 9, - "w": 12, - "x": 0, - "y": 36 - }, - "id": 98, - "options": { - "legend": { - "calcs": [ - "lastNotNull", - "mean", - "max" - ], - "displayMode": "table", - "placement": "right", - "showLegend": true - }, - "tooltip": { - "mode": "single", - "sort": "none" - } - }, - "pluginVersion": "8.3.3", - "targets": [ + "properties": [ { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum by(instance) (rate(apiserver_request_total{code=~\"5..\", job=~\"kubernetes-apiservers|apiserver\"}[1m]))", - "interval": "", - "legendFormat": "{{ instance }}", - "range": true, - "refId": "A" + "id": "custom.width", + "value": 370 } - ], - "title": "API Server - Errors by Instance", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "fieldConfig": { - "defaults": { - "color": { - "mode": "palette-classic" - }, - "custom": { - "axisBorderShow": false, - "axisCenteredZero": false, - "axisColorMode": "text", - "axisLabel": "", - "axisPlacement": "auto", - "barAlignment": 0, - "drawStyle": "line", - "fillOpacity": 25, - "gradientMode": "opacity", - "hideFrom": { - "legend": false, - "tooltip": false, - "viz": false - }, - "insertNulls": false, - "lineInterpolation": "smooth", - "lineWidth": 2, - "pointSize": 5, - "scaleDistribution": { - "type": "linear" - }, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - }, - "thresholdsStyle": { - "mode": "off" - } - }, - "mappings": [], - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - }, - { - "color": "red", - "value": 80 - } - ] - }, - "unit": "ms" - }, - "overrides": [] - }, - "gridPos": { - "h": 9, - "w": 12, - "x": 12, - "y": 36 - }, - "id": 97, - "options": { - "legend": { - "calcs": [ - "lastNotNull", - "mean", - "max" - ], - "displayMode": "table", - 
"placement": "right", - "showLegend": true - }, - "tooltip": { - "mode": "multi", - "sort": "desc" - } - }, - "pluginVersion": "8.3.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(rate(apiserver_request_duration_seconds_sum{job=~\"kubernetes-apiservers|apiserver\"}[1m])) by (verb)\n/\nsum(rate(apiserver_request_duration_seconds_count{job=~\"kubernetes-apiservers|apiserver\"}[1m])) by (verb)", - "interval": "", - "legendFormat": "{{ verb }}", - "range": true, - "refId": "A" - } - ], - "title": "API Server - HTTP Requests Latency by verb", - "type": "timeseries" - }, - { - "datasource": { - "type": "prometheus", - "uid": "${DATASOURCE}" - }, - "description": "Last 5Min", - "fieldConfig": { - "defaults": { - "color": { - "mode": "continuous-GrYlRd" - }, - "mappings": [], - "min": 0, - "thresholds": { - "mode": "absolute", - "steps": [ - { - "color": "green" - } - ] - }, - "unit": "dtdurations" - }, - "overrides": [] - }, - "gridPos": { - "h": 12, - "w": 24, - "x": 0, - "y": 45 - }, - "id": 130, - "options": { - "displayMode": "gradient", - "maxVizHeight": 300, - "minVizHeight": 16, - "minVizWidth": 8, - "namePlacement": "auto", - "orientation": "horizontal", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "showUnfilled": true, - "sizing": "auto", - "valueMode": "color" - }, - "pluginVersion": "10.4.3", - "targets": [ - { - "datasource": { - "type": "prometheus", - "uid": "952b8fca-4117-4324-92cc-fba33c458982" - }, - "editorMode": "code", - "exemplar": false, - "expr": "topk(10, cluster_quantile:apiserver_request_duration_seconds:histogram_quantile{job=~\".+\",quantile=\"0.9\", subresource=\"\"})", - "instant": true, - "legendFormat": "{{resource}}:{{verb}}", - "range": false, - "refId": "A" - } - ], - "title": "Slowest Requests (Top 10) ", - "type": "bargauge" + ] } - ], - "title": "API Server", - "type": "row" - } - 
], - "preload": false, - "refresh": "", - "schemaVersion": 40, - "tags": [], - "templating": { - "list": [ + ] + }, + "gridPos": { + "h": 8, + "w": 24, + "x": 0, + "y": 276 + }, + "id": 24, + "options": { + "cellHeight": "sm", + "footer": { + "countRows": false, + "fields": "", + "reducer": [ + "sum" + ], + "show": false + }, + "frameIndex": 2, + "showHeader": true, + "sortBy": [ + { + "desc": false, + "displayName": "PersistentVolumeClaim" + } + ] + }, + "pluginVersion": "12.1.0", + "targets": [ { - "current": {}, - "includeAll": false, - "label": "Datasource", - "name": "DATASOURCE", - "options": [], - "query": "prometheus", - "refresh": 1, - "regex": "", - "type": "datasource" + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": " sum by (persistentvolumeclaim,namespace,storageclass,volumename) (kube_persistentvolumeclaim_info{cluster=~\"$cluster\"})", + "format": "table", + "instant": true, + "interval": "", + "legendFormat": "", + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum by (persistentvolumeclaim) (kubelet_volume_stats_capacity_bytes{cluster=~\"$cluster\"}/1024/1024/1024)", + "format": "table", + "instant": true, + "interval": "", + "legendFormat": "", + "refId": "B" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum by (persistentvolumeclaim) (kubelet_volume_stats_used_bytes{cluster=~\"$cluster\"}/1024/1024/1024)", + "format": "table", + "instant": true, + "interval": "", + "legendFormat": "", + "refId": "C" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum by (persistentvolumeclaim) (kubelet_volume_stats_available_bytes{cluster=~\"$cluster\"}/1024/1024/1024)", + "format": "table", + "instant": true, + "interval": "", + "legendFormat": "", + "refId": "D" + }, + { + "datasource": { + "type": "prometheus", + 
"uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum(kube_persistentvolumeclaim_status_phase{phase=~\"(Pending|Lost)\",cluster=~\"$cluster\"}) by (persistentvolumeclaim) + sum(kube_persistentvolumeclaim_status_phase{phase=~\"(Lost)\",cluster=~\"$cluster\"}) by (persistentvolumeclaim)", + "format": "table", + "instant": true, + "interval": "", + "legendFormat": "", + "refId": "E" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "sum by (persistentvolumeclaim) (kubelet_volume_stats_used_bytes{cluster=~\"$cluster\"}/kubelet_volume_stats_capacity_bytes{cluster=~\"$cluster\"} * 100)", + "format": "table", + "instant": true, + "interval": "", + "legendFormat": "", + "refId": "F" } - ] + ], + "title": "PVC Overview", + "transformations": [ + { + "id": "seriesToColumns", + "options": { + "byField": "persistentvolumeclaim" + } + }, + { + "id": "organize", + "options": { + "excludeByName": { + "Time": true, + "Time 1": true, + "Time 2": true, + "Time 3": true, + "Time 4": true, + "Time 5": true, + "Time 6": true, + "Value #A": true + }, + "indexByName": {}, + "renameByName": { + "Time 1": "", + "Time 2": "", + "Time 3": "", + "Time 4": "", + "Time 5": "", + "Time 6": "", + "Value #A": "", + "Value #B": "Capacity (GiB)", + "Value #C": "Used (GiB)", + "Value #D": "Available (GiB)", + "Value #E": "Status", + "Value #F": "Used (%)", + "namespace": "Namespace", + "persistentvolumeclaim": "PersistentVolumeClaim", + "storageclass": "StorageClass", + "volumename": "PhysicalVolume" + } + } + } + ], + "type": "table" }, - "time": { - "from": "now-6h", - "to": "now" + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + 
"fillOpacity": 0, + "gradientMode": "none", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "linear", + "lineWidth": 1, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "bytes" + }, + "overrides": [] + }, + "gridPos": { + "h": 12, + "w": 24, + "x": 0, + "y": 284 + }, + "id": 68, + "options": { + "legend": { + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "multi", + "sort": "desc" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "(max by (persistentvolumeclaim,namespace) (kubelet_volume_stats_used_bytes{cluster=~\"$cluster\"}))", + "interval": "", + "legendFormat": "{{namespace}} ({{persistentvolumeclaim}})", + "range": true, + "refId": "A" + } + ], + "title": "All Running PVCs Used Bytes", + "type": "timeseries" }, - "timepicker": {}, - "timezone": "", - "title": "Kubernetes / Overview", - "uid": "k8s-overview-uid", - "version": 1, - "weekStart": "" - } \ No newline at end of file + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "WARNING: Any PVCs that are not bound to a running pod will not show up in this state.", + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + 
"fillOpacity": 0, + "gradientMode": "none", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "linear", + "lineWidth": 1, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "links": [], + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "bytes" + }, + "overrides": [] + }, + "gridPos": { + "h": 11, + "w": 24, + "x": 0, + "y": 296 + }, + "id": 78, + "options": { + "legend": { + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "multi", + "sort": "asc" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "expr": "rate(kubelet_volume_stats_used_bytes{cluster=~\"$cluster\"} [1d])", + "format": "time_series", + "instant": false, + "interval": "", + "intervalFactor": 1, + "legendFormat": "{{namespace}} ({{persistentvolumeclaim}})", + "refId": "A" + } + ], + "title": "Daily Volume Use Rate (1D)", + "type": "timeseries" + }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 307 + }, + "id": 1, + "panels": [], + "title": "API Server", + "type": "row" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "mappings": [ + { + "options": { + "0": { + "text": "DOWN" + }, + "1": { + "text": "UP" + } + }, + "type": "value" + } + ], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "red", + "value": 0 + }, + { + "color": "green", + "value": 1 + } + ] + } + }, + "overrides": [] + }, + "gridPos": { + "h": 8, + "w": 12, + "x": 0, + "y": 
308 + }, + "id": 2, + "options": { + "colorMode": "background", + "graphMode": "none", + "justifyMode": "auto", + "orientation": "horizontal", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "textMode": "value_and_name", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "up{job=\"apiserver\", cluster=~\"$cluster\"}", + "interval": "", + "legendFormat": "{{instance}}", + "range": true, + "refId": "A" + } + ], + "title": "Health Status", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Last 5Min", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [], + "max": 1, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "text", + "value": 0 + } + ] + }, + "unit": "percentunit" + }, + "overrides": [] + }, + "gridPos": { + "h": 8, + "w": 6, + "x": 12, + "y": 308 + }, + "id": 128, + "options": { + "colorMode": "value", + "graphMode": "none", + "justifyMode": "auto", + "orientation": "auto", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "952b8fca-4117-4324-92cc-fba33c458982" + }, + "editorMode": "code", + "expr": "sum(irate(apiserver_request_total{code=~\"20.*\",verb=~\"GET|LIST\",cluster=~\"$cluster\"}[5m]))/sum(irate(apiserver_request_total{verb=~\"GET|LIST\",cluster=~\"$cluster\"}[5m]))", + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "A" + } + ], + "title": "API Server - Read Success Rate", + "type": 
"stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Last 5Min", + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "mappings": [], + "max": 1, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "text", + "value": 0 + } + ] + }, + "unit": "percentunit" + }, + "overrides": [] + }, + "gridPos": { + "h": 8, + "w": 6, + "x": 18, + "y": 308 + }, + "id": 129, + "options": { + "colorMode": "value", + "graphMode": "none", + "justifyMode": "auto", + "orientation": "auto", + "percentChangeColorMode": "standard", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showPercentChange": false, + "textMode": "auto", + "wideLayout": true + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "952b8fca-4117-4324-92cc-fba33c458982" + }, + "editorMode": "code", + "expr": "sum(irate(apiserver_request_total{code=~\"20.*\",verb!~\"GET|LIST|WATCH|CONNECT\",cluster=~\"$cluster\"}[5m]))/sum(irate(apiserver_request_total{verb!~\"GET|LIST|WATCH|CONNECT\",cluster=~\"$cluster\"}[5m]))", + "instant": false, + "legendFormat": "__auto", + "range": true, + "refId": "A" + } + ], + "title": "API Server - Write Success Rate", + "type": "stat" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 25, + "gradientMode": "opacity", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "smooth", + "lineWidth": 2, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, 
+ "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "decimals": 2, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "s" + }, + "overrides": [] + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 316 + }, + "id": 100, + "options": { + "legend": { + "calcs": [ + "lastNotNull", + "mean", + "max" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "single", + "sort": "none" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "rate(process_cpu_seconds_total{job=~\"kubernetes-apiservers|apiserver\",cluster=~\"$cluster\"}[1m])", + "interval": "", + "legendFormat": "{{ instance }}", + "range": true, + "refId": "A" + } + ], + "title": "API Server - CPU Usage in CPU Seconds", + "type": "timeseries" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "custom": { + "align": "auto", + "cellOptions": { + "type": "auto" + }, + "inspect": false + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + } + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "_name_" + }, + "properties": [ + { + "id": "custom.width", + "value": 188 + } + ] + } + ] + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 316 + }, + "id": 5, + "options": { + "cellHeight": "sm", + "footer": { + "countRows": false, + "fields": "", + "reducer": [ + "sum" + ], + "show": false + }, + "showHeader": true, + "sortBy": [ + { + "desc": false, + "displayName": "removed_release" + } + ] + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + 
"type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "apiserver_requested_deprecated_apis{cluster=~\"$cluster\"}", + "interval": "", + "legendFormat": "__auto", + "range": true, + "refId": "A" + } + ], + "title": "Deprecated Kubernetes Resources", + "transformations": [ + { + "id": "labelsToFields", + "options": { + "keepLabels": [ + "group", + "job", + "removed_release", + "resource", + "version", + "name" + ], + "mode": "columns" + } + }, + { + "id": "merge", + "options": {} + }, + { + "id": "organize", + "options": { + "excludeByName": { + "Time": true, + "Value": true, + "job": true + }, + "indexByName": { + "Time": 6, + "Value": 7, + "group": 1, + "job": 5, + "namespace": 0, + "removed_release": 4, + "resource": 3, + "version": 2 + }, + "renameByName": {} + } + }, + { + "id": "groupBy", + "options": { + "fields": { + "group": { + "aggregations": [ + "lastNotNull" + ], + "operation": "groupby" + }, + "job": { + "aggregations": [], + "operation": "groupby" + }, + "namespace": { + "aggregations": [ + "lastNotNull" + ], + "operation": "groupby" + }, + "removed_release": { + "aggregations": [], + "operation": "groupby" + }, + "resource": { + "aggregations": [ + "lastNotNull" + ], + "operation": "groupby" + }, + "version": { + "aggregations": [], + "operation": "groupby" + } + } + } + } + ], + "type": "table" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 25, + "gradientMode": "opacity", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "smooth", + "lineWidth": 2, + "pointSize": 5, + "scaleDistribution": { + "type": 
"linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "ms" + }, + "overrides": [] + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 325 + }, + "id": 96, + "options": { + "legend": { + "calcs": [ + "lastNotNull", + "mean", + "max" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "single", + "sort": "none" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(rate(apiserver_request_duration_seconds_sum{job=~\"kubernetes-apiservers|apiserver\",cluster=~\"$cluster\"}[1m])) by (instance)\n/\nsum(rate(apiserver_request_duration_seconds_count{job=~\"kubernetes-apiservers|apiserver\",cluster=~\"$cluster\"}[1m])) by (instance)", + "interval": "", + "legendFormat": "{{ instance }}", + "range": true, + "refId": "A" + } + ], + "title": "API Server - HTTP Requests Latency by instance", + "type": "timeseries" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 25, + "gradientMode": "opacity", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "smooth", + "lineWidth": 2, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + 
"group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "bytes" + }, + "overrides": [] + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 325 + }, + "id": 101, + "options": { + "legend": { + "calcs": [ + "lastNotNull", + "mean", + "max" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "single", + "sort": "none" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "process_resident_memory_bytes{job=~\"kubernetes-apiservers|apiserver\",cluster=~\"$cluster\"}", + "interval": "", + "legendFormat": "{{ instance }}", + "range": true, + "refId": "A" + } + ], + "title": "API Server - Memory Usage by instance", + "type": "timeseries" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 25, + "gradientMode": "opacity", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "smooth", + "lineWidth": 2, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": 
"short" + }, + "overrides": [] + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 334 + }, + "id": 98, + "options": { + "legend": { + "calcs": [ + "lastNotNull", + "mean", + "max" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "single", + "sort": "none" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum by(instance) (rate(apiserver_request_total{code=~\"5..\", job=~\"kubernetes-apiservers|apiserver\"}[1m]))", + "interval": "", + "legendFormat": "{{ instance }}", + "range": true, + "refId": "A" + } + ], + "title": "API Server - Errors by Instance", + "type": "timeseries" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "palette-classic" + }, + "custom": { + "axisBorderShow": false, + "axisCenteredZero": false, + "axisColorMode": "text", + "axisLabel": "", + "axisPlacement": "auto", + "barAlignment": 0, + "barWidthFactor": 0.6, + "drawStyle": "line", + "fillOpacity": 25, + "gradientMode": "opacity", + "hideFrom": { + "legend": false, + "tooltip": false, + "viz": false + }, + "insertNulls": false, + "lineInterpolation": "smooth", + "lineWidth": 2, + "pointSize": 5, + "scaleDistribution": { + "type": "linear" + }, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + }, + "thresholdsStyle": { + "mode": "off" + } + }, + "mappings": [], + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "red", + "value": 80 + } + ] + }, + "unit": "ms" + }, + "overrides": [] + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 334 + }, + "id": 97, + "options": { + "legend": { + "calcs": [ + "lastNotNull", + "mean", + "max" + ], + "displayMode": "table", + "placement": "right", + 
"showLegend": true + }, + "tooltip": { + "hideZeros": false, + "mode": "multi", + "sort": "desc" + } + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(rate(apiserver_request_duration_seconds_sum{job=~\"kubernetes-apiservers|apiserver\"}[1m])) by (verb)\n/\nsum(rate(apiserver_request_duration_seconds_count{job=~\"kubernetes-apiservers|apiserver\"}[1m])) by (verb)", + "interval": "", + "legendFormat": "{{ verb }}", + "range": true, + "refId": "A" + } + ], + "title": "API Server - HTTP Requests Latency by verb", + "type": "timeseries" + }, + { + "datasource": { + "type": "prometheus", + "uid": "Mimir" + }, + "description": "Last 5Min", + "fieldConfig": { + "defaults": { + "color": { + "mode": "continuous-GrYlRd" + }, + "mappings": [], + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + } + ] + }, + "unit": "dtdurations" + }, + "overrides": [] + }, + "gridPos": { + "h": 12, + "w": 24, + "x": 0, + "y": 343 + }, + "id": 130, + "options": { + "displayMode": "gradient", + "legend": { + "calcs": [], + "displayMode": "list", + "placement": "bottom", + "showLegend": false + }, + "maxVizHeight": 300, + "minVizHeight": 16, + "minVizWidth": 8, + "namePlacement": "auto", + "orientation": "horizontal", + "reduceOptions": { + "calcs": [ + "lastNotNull" + ], + "fields": "", + "values": false + }, + "showUnfilled": true, + "sizing": "auto", + "valueMode": "color" + }, + "pluginVersion": "12.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "952b8fca-4117-4324-92cc-fba33c458982" + }, + "editorMode": "code", + "exemplar": false, + "expr": "topk(10, cluster_quantile:apiserver_request_duration_seconds:histogram_quantile{job=~\".+\",quantile=\"0.9\", subresource=\"\"})", + "instant": true, + "legendFormat": "{{resource}}:{{verb}}", + "range": false, + "refId": "A" + } + ], + "title": 
"Slowest Requests (Top 10) ", + "type": "bargauge" + } + ], + "preload": false, + "refresh": "", + "schemaVersion": 41, + "tags": [], + "templating": { + "list": [ + { + "current": { + "text": "All", + "value": "$__all" + }, + "definition": "label_values(kube_node_info,cluster)", + "includeAll": true, + "label": "Cluster", + "name": "cluster", + "options": [], + "query": { + "qryType": 1, + "query": "label_values(kube_node_info,cluster)", + "refId": "PrometheusVariableQueryEditor-VariableQuery" + }, + "refresh": 1, + "regex": "", + "type": "query" + } + ] + }, + "time": { + "from": "now-6h", + "to": "now" + }, + "timepicker": {}, + "timezone": "", + "title": "Kubernetes / Overview to change", + "uid": "new_kuber", + "version": 22 +} \ No newline at end of file