1 # Licensed under the Apache License, Version 2.0 (the "License");
2 # you may not use this file except in compliance with the License.
3 # You may obtain a copy of the License at
5 # http://www.apache.org/licenses/LICENSE-2.0
7 # Unless required by applicable law or agreed to in writing, software
8 # distributed under the License is distributed on an "AS IS" BASIS,
9 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
10 # See the License for the specific language governing permissions and
11 # limitations under the License.
14 Generated from 'kubelet' from https://raw.githubusercontent.com/prometheus-operator/kube-prometheus/master/manifests/grafana-dashboardDefinitions.yaml
15 Do not change in-place! In order to change this file, first read the following link:
16 https://github.com/prometheus-community/helm-charts/tree/main/charts/kube-prometheus-stack/hack
18 {{- $kubeTargetVersion := default .Capabilities.KubeVersion.GitVersion .Values.kubeTargetVersionOverride }}
19 {{- if and (or .Values.grafana.enabled .Values.grafana.forceDeployDashboards) (semverCompare ">=1.14.0-0" $kubeTargetVersion) (semverCompare "<9.9.9-9" $kubeTargetVersion) .Values.grafana.defaultDashboardsEnabled .Values.kubelet.enabled }}
23 namespace: {{ template "kube-prometheus-stack.namespace" . }}
24 name: {{ printf "%s-%s" (include "kube-prometheus-stack.fullname" $) "kubelet" | trunc 63 | trimSuffix "-" }}
26 {{ toYaml .Values.grafana.sidecar.dashboards.annotations | indent 4 }}
28 {{- if $.Values.grafana.sidecar.dashboards.label }}
29 {{ $.Values.grafana.sidecar.dashboards.label }}: "1"
31 app: {{ template "kube-prometheus-stack.name" $ }}-grafana
32 {{ include "kube-prometheus-stack.labels" $ | indent 4 }}
50 "hideControls": false,
63 "colorBackground": false,
67 "rgba(237, 129, 40, 0.89)",
70 "datasource": "$datasource",
76 "thresholdLabels": false,
77 "thresholdMarkers": true
90 "name": "value to text",
94 "name": "range to text",
99 "nullPointMode": "connected",
102 "postfixFontSize": "50%",
104 "prefixFontSize": "50%",
114 "fillColor": "rgba(31, 118, 189, 0.18)",
116 "lineColor": "rgb(31, 120, 193)",
122 "expr": "sum(kubelet_node_name{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\"})",
123 "format": "time_series",
130 "title": "Running Kubelets",
134 "type": "singlestat",
135 "valueFontSize": "80%",
146 "cacheTimeout": null,
147 "colorBackground": false,
151 "rgba(237, 129, 40, 0.89)",
154 "datasource": "$datasource",
160 "thresholdLabels": false,
161 "thresholdMarkers": true
174 "name": "value to text",
178 "name": "range to text",
182 "maxDataPoints": 100,
183 "nullPointMode": "connected",
186 "postfixFontSize": "50%",
188 "prefixFontSize": "50%",
198 "fillColor": "rgba(31, 118, 189, 0.18)",
200 "lineColor": "rgb(31, 120, 193)",
206 "expr": "sum(kubelet_running_pods{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\"}) OR sum(kubelet_running_pod_count{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\"})",
207 "format": "time_series",
209 "legendFormat": "{{`{{`}}instance{{`}}`}}",
214 "title": "Running Pods",
218 "type": "singlestat",
219 "valueFontSize": "80%",
230 "cacheTimeout": null,
231 "colorBackground": false,
235 "rgba(237, 129, 40, 0.89)",
238 "datasource": "$datasource",
244 "thresholdLabels": false,
245 "thresholdMarkers": true
258 "name": "value to text",
262 "name": "range to text",
266 "maxDataPoints": 100,
267 "nullPointMode": "connected",
270 "postfixFontSize": "50%",
272 "prefixFontSize": "50%",
282 "fillColor": "rgba(31, 118, 189, 0.18)",
284 "lineColor": "rgb(31, 120, 193)",
290 "expr": "sum(kubelet_running_containers{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\"}) OR sum(kubelet_running_container_count{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\"})",
291 "format": "time_series",
293 "legendFormat": "{{`{{`}}instance{{`}}`}}",
298 "title": "Running Containers",
302 "type": "singlestat",
303 "valueFontSize": "80%",
314 "cacheTimeout": null,
315 "colorBackground": false,
319 "rgba(237, 129, 40, 0.89)",
322 "datasource": "$datasource",
328 "thresholdLabels": false,
329 "thresholdMarkers": true
342 "name": "value to text",
346 "name": "range to text",
350 "maxDataPoints": 100,
351 "nullPointMode": "connected",
354 "postfixFontSize": "50%",
356 "prefixFontSize": "50%",
366 "fillColor": "rgba(31, 118, 189, 0.18)",
368 "lineColor": "rgb(31, 120, 193)",
374 "expr": "sum(volume_manager_total_volumes{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\", state=\"actual_state_of_world\"})",
375 "format": "time_series",
377 "legendFormat": "{{`{{`}}instance{{`}}`}}",
382 "title": "Actual Volume Count",
386 "type": "singlestat",
387 "valueFontSize": "80%",
398 "cacheTimeout": null,
399 "colorBackground": false,
403 "rgba(237, 129, 40, 0.89)",
406 "datasource": "$datasource",
412 "thresholdLabels": false,
413 "thresholdMarkers": true
426 "name": "value to text",
430 "name": "range to text",
434 "maxDataPoints": 100,
435 "nullPointMode": "connected",
438 "postfixFontSize": "50%",
440 "prefixFontSize": "50%",
450 "fillColor": "rgba(31, 118, 189, 0.18)",
452 "lineColor": "rgb(31, 120, 193)",
458 "expr": "sum(volume_manager_total_volumes{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\",state=\"desired_state_of_world\"})",
459 "format": "time_series",
461 "legendFormat": "{{`{{`}}instance{{`}}`}}",
466 "title": "Desired Volume Count",
470 "type": "singlestat",
471 "valueFontSize": "80%",
482 "cacheTimeout": null,
483 "colorBackground": false,
487 "rgba(237, 129, 40, 0.89)",
490 "datasource": "$datasource",
496 "thresholdLabels": false,
497 "thresholdMarkers": true
510 "name": "value to text",
514 "name": "range to text",
518 "maxDataPoints": 100,
519 "nullPointMode": "connected",
522 "postfixFontSize": "50%",
524 "prefixFontSize": "50%",
534 "fillColor": "rgba(31, 118, 189, 0.18)",
536 "lineColor": "rgb(31, 120, 193)",
542 "expr": "sum(rate(kubelet_node_config_error{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\"}[5m]))",
543 "format": "time_series",
545 "legendFormat": "{{`{{`}}instance{{`}}`}}",
550 "title": "Config Error Count",
554 "type": "singlestat",
555 "valueFontSize": "80%",
567 "repeatIteration": null,
570 "title": "Dashboard Row",
585 "datasource": "$datasource",
593 "alignAsTable": true,
609 "nullPointMode": "null",
621 "steppedLine": false,
624 "expr": "sum(rate(kubelet_runtime_operations_total{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}[5m])) by (operation_type, instance)",
625 "format": "time_series",
627 "legendFormat": "{{`{{`}}instance{{`}}`}} {{`{{`}}operation_type{{`}}`}}",
636 "title": "Operation Rate",
640 "value_type": "individual"
678 "datasource": "$datasource",
686 "alignAsTable": true,
702 "nullPointMode": "null",
714 "steppedLine": false,
717 "expr": "sum(rate(kubelet_runtime_operations_errors_total{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}[5m])) by (instance, operation_type)",
718 "format": "time_series",
720 "legendFormat": "{{`{{`}}instance{{`}}`}} {{`{{`}}operation_type{{`}}`}}",
729 "title": "Operation Error Rate",
733 "value_type": "individual"
766 "repeatIteration": null,
769 "title": "Dashboard Row",
784 "datasource": "$datasource",
792 "alignAsTable": true,
808 "nullPointMode": "null",
820 "steppedLine": false,
823 "expr": "histogram_quantile(0.99, sum(rate(kubelet_runtime_operations_duration_seconds_bucket{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}[5m])) by (instance, operation_type, le))",
824 "format": "time_series",
826 "legendFormat": "{{`{{`}}instance{{`}}`}} {{`{{`}}operation_type{{`}}`}}",
835 "title": "Operation duration 99th quantile",
839 "value_type": "individual"
872 "repeatIteration": null,
875 "title": "Dashboard Row",
890 "datasource": "$datasource",
898 "alignAsTable": true,
914 "nullPointMode": "null",
926 "steppedLine": false,
929 "expr": "sum(rate(kubelet_pod_start_duration_seconds_count{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}[5m])) by (instance)",
930 "format": "time_series",
932 "legendFormat": "{{`{{`}}instance{{`}}`}} pod",
936 "expr": "sum(rate(kubelet_pod_worker_duration_seconds_count{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}[5m])) by (instance)",
937 "format": "time_series",
939 "legendFormat": "{{`{{`}}instance{{`}}`}} worker",
948 "title": "Pod Start Rate",
952 "value_type": "individual"
990 "datasource": "$datasource",
998 "alignAsTable": true,
1014 "nullPointMode": "null",
1015 "percentage": false,
1020 "seriesOverrides": [
1026 "steppedLine": false,
1029 "expr": "histogram_quantile(0.99, sum(rate(kubelet_pod_start_duration_seconds_bucket{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}[5m])) by (instance, le))",
1030 "format": "time_series",
1031 "intervalFactor": 2,
1032 "legendFormat": "{{`{{`}}instance{{`}}`}} pod",
1036 "expr": "histogram_quantile(0.99, sum(rate(kubelet_pod_worker_duration_seconds_bucket{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}[5m])) by (instance, le))",
1037 "format": "time_series",
1038 "intervalFactor": 2,
1039 "legendFormat": "{{`{{`}}instance{{`}}`}} worker",
1048 "title": "Pod Start Duration",
1052 "value_type": "individual"
1085 "repeatIteration": null,
1086 "repeatRowId": null,
1088 "title": "Dashboard Row",
1103 "datasource": "$datasource",
1111 "alignAsTable": true,
1129 "nullPointMode": "null",
1130 "percentage": false,
1135 "seriesOverrides": [
1141 "steppedLine": false,
1144 "expr": "sum(rate(storage_operation_duration_seconds_count{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}[5m])) by (instance, operation_name, volume_plugin)",
1145 "format": "time_series",
1146 "intervalFactor": 2,
1147 "legendFormat": "{{`{{`}}instance{{`}}`}} {{`{{`}}operation_name{{`}}`}} {{`{{`}}volume_plugin{{`}}`}}",
1156 "title": "Storage Operation Rate",
1160 "value_type": "individual"
1198 "datasource": "$datasource",
1206 "alignAsTable": true,
1224 "nullPointMode": "null",
1225 "percentage": false,
1230 "seriesOverrides": [
1236 "steppedLine": false,
1239 "expr": "sum(rate(storage_operation_errors_total{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}[5m])) by (instance, operation_name, volume_plugin)",
1240 "format": "time_series",
1241 "intervalFactor": 2,
1242 "legendFormat": "{{`{{`}}instance{{`}}`}} {{`{{`}}operation_name{{`}}`}} {{`{{`}}volume_plugin{{`}}`}}",
1251 "title": "Storage Operation Error Rate",
1255 "value_type": "individual"
1288 "repeatIteration": null,
1289 "repeatRowId": null,
1291 "title": "Dashboard Row",
1306 "datasource": "$datasource",
1314 "alignAsTable": true,
1332 "nullPointMode": "null",
1333 "percentage": false,
1338 "seriesOverrides": [
1344 "steppedLine": false,
1347 "expr": "histogram_quantile(0.99, sum(rate(storage_operation_duration_seconds_bucket{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\"}[5m])) by (instance, operation_name, volume_plugin, le))",
1348 "format": "time_series",
1349 "intervalFactor": 2,
1350 "legendFormat": "{{`{{`}}instance{{`}}`}} {{`{{`}}operation_name{{`}}`}} {{`{{`}}volume_plugin{{`}}`}}",
1359 "title": "Storage Operation Duration 99th quantile",
1363 "value_type": "individual"
1396 "repeatIteration": null,
1397 "repeatRowId": null,
1399 "title": "Dashboard Row",
1414 "datasource": "$datasource",
1422 "alignAsTable": true,
1438 "nullPointMode": "null",
1439 "percentage": false,
1444 "seriesOverrides": [
1450 "steppedLine": false,
1453 "expr": "sum(rate(kubelet_cgroup_manager_duration_seconds_count{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\"}[5m])) by (instance, operation_type)",
1454 "format": "time_series",
1455 "intervalFactor": 2,
1456 "legendFormat": "{{`{{`}}instance{{`}}`}} {{`{{`}}operation_type{{`}}`}}",
1465 "title": "Cgroup manager operation rate",
1469 "value_type": "individual"
1507 "datasource": "$datasource",
1515 "alignAsTable": true,
1531 "nullPointMode": "null",
1532 "percentage": false,
1537 "seriesOverrides": [
1543 "steppedLine": false,
1546 "expr": "histogram_quantile(0.99, sum(rate(kubelet_cgroup_manager_duration_seconds_bucket{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\"}[5m])) by (instance, operation_type, le))",
1547 "format": "time_series",
1548 "intervalFactor": 2,
1549 "legendFormat": "{{`{{`}}instance{{`}}`}} {{`{{`}}operation_type{{`}}`}}",
1558 "title": "Cgroup manager 99th quantile",
1562 "value_type": "individual"
1595 "repeatIteration": null,
1596 "repeatRowId": null,
1598 "title": "Dashboard Row",
1613 "datasource": "$datasource",
1614 "description": "Pod lifecycle event generator",
1622 "alignAsTable": true,
1638 "nullPointMode": "null",
1639 "percentage": false,
1644 "seriesOverrides": [
1650 "steppedLine": false,
1653 "expr": "sum(rate(kubelet_pleg_relist_duration_seconds_count{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\"}[5m])) by (instance)",
1654 "format": "time_series",
1655 "intervalFactor": 2,
1656 "legendFormat": "{{`{{`}}instance{{`}}`}}",
1665 "title": "PLEG relist rate",
1669 "value_type": "individual"
1707 "datasource": "$datasource",
1715 "alignAsTable": true,
1731 "nullPointMode": "null",
1732 "percentage": false,
1737 "seriesOverrides": [
1743 "steppedLine": false,
1746 "expr": "histogram_quantile(0.99, sum(rate(kubelet_pleg_relist_interval_seconds_bucket{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}[5m])) by (instance, le))",
1747 "format": "time_series",
1748 "intervalFactor": 2,
1749 "legendFormat": "{{`{{`}}instance{{`}}`}}",
1758 "title": "PLEG relist interval",
1762 "value_type": "individual"
1795 "repeatIteration": null,
1796 "repeatRowId": null,
1798 "title": "Dashboard Row",
1813 "datasource": "$datasource",
1821 "alignAsTable": true,
1837 "nullPointMode": "null",
1838 "percentage": false,
1843 "seriesOverrides": [
1849 "steppedLine": false,
1852 "expr": "histogram_quantile(0.99, sum(rate(kubelet_pleg_relist_duration_seconds_bucket{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}[5m])) by (instance, le))",
1853 "format": "time_series",
1854 "intervalFactor": 2,
1855 "legendFormat": "{{`{{`}}instance{{`}}`}}",
1864 "title": "PLEG relist duration",
1868 "value_type": "individual"
1901 "repeatIteration": null,
1902 "repeatRowId": null,
1904 "title": "Dashboard Row",
1919 "datasource": "$datasource",
1927 "alignAsTable": false,
1943 "nullPointMode": "null",
1944 "percentage": false,
1949 "seriesOverrides": [
1955 "steppedLine": false,
1958 "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\",code=~\"2..\"}[5m]))",
1959 "format": "time_series",
1960 "intervalFactor": 2,
1961 "legendFormat": "2xx",
1965 "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\",code=~\"3..\"}[5m]))",
1966 "format": "time_series",
1967 "intervalFactor": 2,
1968 "legendFormat": "3xx",
1972 "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\",code=~\"4..\"}[5m]))",
1973 "format": "time_series",
1974 "intervalFactor": 2,
1975 "legendFormat": "4xx",
1979 "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\",code=~\"5..\"}[5m]))",
1980 "format": "time_series",
1981 "intervalFactor": 2,
1982 "legendFormat": "5xx",
1991 "title": "RPC Rate",
1995 "value_type": "individual"
2028 "repeatIteration": null,
2029 "repeatRowId": null,
2031 "title": "Dashboard Row",
2046 "datasource": "$datasource",
2054 "alignAsTable": true,
2070 "nullPointMode": "null",
2071 "percentage": false,
2076 "seriesOverrides": [
2082 "steppedLine": false,
2085 "expr": "histogram_quantile(0.99, sum(rate(rest_client_request_duration_seconds_bucket{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\", instance=~\"$instance\"}[5m])) by (instance, verb, url, le))",
2086 "format": "time_series",
2087 "intervalFactor": 2,
2088 "legendFormat": "{{`{{`}}instance{{`}}`}} {{`{{`}}verb{{`}}`}} {{`{{`}}url{{`}}`}}",
2097 "title": "Request duration 99th quantile",
2101 "value_type": "individual"
2134 "repeatIteration": null,
2135 "repeatRowId": null,
2137 "title": "Dashboard Row",
2152 "datasource": "$datasource",
2160 "alignAsTable": false,
2176 "nullPointMode": "null",
2177 "percentage": false,
2182 "seriesOverrides": [
2188 "steppedLine": false,
2191 "expr": "process_resident_memory_bytes{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}",
2192 "format": "time_series",
2193 "intervalFactor": 2,
2194 "legendFormat": "{{`{{`}}instance{{`}}`}}",
2207 "value_type": "individual"
2245 "datasource": "$datasource",
2253 "alignAsTable": false,
2269 "nullPointMode": "null",
2270 "percentage": false,
2275 "seriesOverrides": [
2281 "steppedLine": false,
2284 "expr": "rate(process_cpu_seconds_total{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}[5m])",
2285 "format": "time_series",
2286 "intervalFactor": 2,
2287 "legendFormat": "{{`{{`}}instance{{`}}`}}",
2296 "title": "CPU usage",
2300 "value_type": "individual"
2338 "datasource": "$datasource",
2346 "alignAsTable": false,
2362 "nullPointMode": "null",
2363 "percentage": false,
2368 "seriesOverrides": [
2374 "steppedLine": false,
2377 "expr": "go_goroutines{cluster=\"$cluster\",job=\"kubelet\", metrics_path=\"/metrics\",instance=~\"$instance\"}",
2378 "format": "time_series",
2379 "intervalFactor": 2,
2380 "legendFormat": "{{`{{`}}instance{{`}}`}}",
2389 "title": "Goroutines",
2393 "value_type": "individual"
2426 "repeatIteration": null,
2427 "repeatRowId": null,
2429 "title": "Dashboard Row",
2434 "schemaVersion": 14,
2448 "name": "datasource",
2452 "query": "prometheus",
2455 "type": "datasource"
2462 "datasource": "$datasource",
2463 "hide": {{ if .Values.grafana.sidecar.dashboards.multicluster }}0{{ else }}2{{ end }},
2464 "includeAll": false,
2471 "query": "label_values(kube_pod_info, cluster)",
2475 "tagValuesQuery": "",
2488 "datasource": "$datasource",
2497 "query": "label_values(kubelet_runtime_operations_total{cluster=\"$cluster\", job=\"kubelet\", metrics_path=\"/metrics\"}, instance)",
2501 "tagValuesQuery": "",
2516 "refresh_intervals": [
2541 "title": "Kubernetes / Kubelet",
2542 "uid": "3138fa155d5915769fbded898ac09fd9",