1 # Generated from 'node.rules' group from https://raw.githubusercontent.com/coreos/prometheus-operator/master/contrib/kube-prometheus/manifests/prometheus-rules.yaml
2 {{- if and .Values.defaultRules.create .Values.nodeExporter.enabled }}
3 apiVersion: {{ printf "%s/v1" (.Values.prometheusOperator.crdApiGroup | default "monitoring.coreos.com") }}
6 name: {{ printf "%s-%s" (include "prometheus-operator.fullname" .) "node.rules" | trunc 63 | trimSuffix "-" }}
8 app: {{ template "prometheus-operator.name" . }}
9 {{ include "prometheus-operator.labels" . | indent 4 }}
10 {{- if .Values.defaultRules.labels }}
11 {{ toYaml .Values.defaultRules.labels | indent 4 }}
13 {{- if .Values.defaultRules.annotations }}
15 {{ toYaml .Values.defaultRules.annotations | indent 4 }}
21 - expr: sum(min(kube_pod_info) by (node))
22 record: ':kube_pod_info_node_count:'
23 - expr: max(label_replace(kube_pod_info{job="kube-state-metrics"}, "pod", "$1", "pod", "(.*)")) by (node, namespace, pod)
24 record: 'node_namespace_pod:kube_pod_info:'
26 count by (node) (sum by (node, cpu) (
27 node_cpu_seconds_total{job="node-exporter"}
28 * on (namespace, pod) group_left(node)
29 node_namespace_pod:kube_pod_info:
31 record: node:node_num_cpu:sum
32 - expr: 1 - avg(rate(node_cpu_seconds_total{job="node-exporter",mode="idle"}[1m]))
33 record: :node_cpu_utilisation:avg1m
36 rate(node_cpu_seconds_total{job="node-exporter",mode="idle"}[1m])
37 * on (namespace, pod) group_left(node)
38 node_namespace_pod:kube_pod_info:)
39 record: node:node_cpu_utilisation:avg1m
41 sum(node_load1{job="node-exporter"})
43 sum(node:node_num_cpu:sum)
44 record: ':node_cpu_saturation_load1:'
47 node_load1{job="node-exporter"}
48 * on (namespace, pod) group_left(node)
49 node_namespace_pod:kube_pod_info:
53 record: 'node:node_cpu_saturation_load1:'
56 sum(node_memory_MemFree_bytes{job="node-exporter"} + node_memory_Cached_bytes{job="node-exporter"} + node_memory_Buffers_bytes{job="node-exporter"})
58 sum(node_memory_MemTotal_bytes{job="node-exporter"})
59 record: ':node_memory_utilisation:'
60 - expr: sum(node_memory_MemFree_bytes{job="node-exporter"} + node_memory_Cached_bytes{job="node-exporter"} + node_memory_Buffers_bytes{job="node-exporter"})
61 record: :node_memory_MemFreeCachedBuffers_bytes:sum
62 - expr: sum(node_memory_MemTotal_bytes{job="node-exporter"})
63 record: :node_memory_MemTotal_bytes:sum
66 (node_memory_MemFree_bytes{job="node-exporter"} + node_memory_Cached_bytes{job="node-exporter"} + node_memory_Buffers_bytes{job="node-exporter"})
67 * on (namespace, pod) group_left(node)
68 node_namespace_pod:kube_pod_info:
70 record: node:node_memory_bytes_available:sum
73 node_memory_MemTotal_bytes{job="node-exporter"}
74 * on (namespace, pod) group_left(node)
75 node_namespace_pod:kube_pod_info:
77 record: node:node_memory_bytes_total:sum
79 (node:node_memory_bytes_total:sum - node:node_memory_bytes_available:sum)
81 scalar(sum(node:node_memory_bytes_total:sum))
82 record: node:node_memory_utilisation:ratio
85 (rate(node_vmstat_pgpgin{job="node-exporter"}[1m])
86 + rate(node_vmstat_pgpgout{job="node-exporter"}[1m]))
88 record: :node_memory_swap_io_bytes:sum_rate
92 (node_memory_MemFree_bytes{job="node-exporter"} + node_memory_Cached_bytes{job="node-exporter"} + node_memory_Buffers_bytes{job="node-exporter"})
93 * on (namespace, pod) group_left(node)
94 node_namespace_pod:kube_pod_info:
98 node_memory_MemTotal_bytes{job="node-exporter"}
99 * on (namespace, pod) group_left(node)
100 node_namespace_pod:kube_pod_info:
102 record: 'node:node_memory_utilisation:'
103 - expr: 1 - (node:node_memory_bytes_available:sum / node:node_memory_bytes_total:sum)
104 record: 'node:node_memory_utilisation_2:'
106 1e3 * sum by (node) (
107 (rate(node_vmstat_pgpgin{job="node-exporter"}[1m])
108 + rate(node_vmstat_pgpgout{job="node-exporter"}[1m]))
109 * on (namespace, pod) group_left(node)
110 node_namespace_pod:kube_pod_info:
112 record: node:node_memory_swap_io_bytes:sum_rate
113 - expr: avg(irate(node_disk_io_time_seconds_total{job="node-exporter",device=~"nvme.+|rbd.+|sd.+|vd.+|xvd.+"}[1m]))
114 record: :node_disk_utilisation:avg_irate
117 irate(node_disk_io_time_seconds_total{job="node-exporter",device=~"nvme.+|rbd.+|sd.+|vd.+|xvd.+"}[1m])
118 * on (namespace, pod) group_left(node)
119 node_namespace_pod:kube_pod_info:
121 record: node:node_disk_utilisation:avg_irate
122 - expr: avg(irate(node_disk_io_time_weighted_seconds_total{job="node-exporter",device=~"nvme.+|rbd.+|sd.+|vd.+|xvd.+"}[1m]) / 1e3)
123 record: :node_disk_saturation:avg_irate
126 irate(node_disk_io_time_weighted_seconds_total{job="node-exporter",device=~"nvme.+|rbd.+|sd.+|vd.+|xvd.+"}[1m]) / 1e3
127 * on (namespace, pod) group_left(node)
128 node_namespace_pod:kube_pod_info:
130 record: node:node_disk_saturation:avg_irate
132 max by (namespace, pod, device) ((node_filesystem_size_bytes{fstype=~"ext[234]|btrfs|xfs|zfs"}
133 - node_filesystem_avail_bytes{fstype=~"ext[234]|btrfs|xfs|zfs"})
134 / node_filesystem_size_bytes{fstype=~"ext[234]|btrfs|xfs|zfs"})
135 record: 'node:node_filesystem_usage:'
136 - expr: max by (namespace, pod, device) (node_filesystem_avail_bytes{fstype=~"ext[234]|btrfs|xfs|zfs"} / node_filesystem_size_bytes{fstype=~"ext[234]|btrfs|xfs|zfs"})
137 record: 'node:node_filesystem_avail:'
139 sum(irate(node_network_receive_bytes_total{job="node-exporter",device="eth0"}[1m])) +
140 sum(irate(node_network_transmit_bytes_total{job="node-exporter",device="eth0"}[1m]))
141 record: :node_net_utilisation:sum_irate
144 (irate(node_network_receive_bytes_total{job="node-exporter",device="eth0"}[1m]) +
145 irate(node_network_transmit_bytes_total{job="node-exporter",device="eth0"}[1m]))
146 * on (namespace, pod) group_left(node)
147 node_namespace_pod:kube_pod_info:
149 record: node:node_net_utilisation:sum_irate
151 sum(irate(node_network_receive_drop_total{job="node-exporter",device="eth0"}[1m])) +
152 sum(irate(node_network_transmit_drop_total{job="node-exporter",device="eth0"}[1m]))
153 record: :node_net_saturation:sum_irate
156 (irate(node_network_receive_drop_total{job="node-exporter",device="eth0"}[1m]) +
157 irate(node_network_transmit_drop_total{job="node-exporter",device="eth0"}[1m]))
158 * on (namespace, pod) group_left(node)
159 node_namespace_pod:kube_pod_info:
161 record: node:node_net_saturation:sum_irate
165 kube_pod_info{job="kube-state-metrics", host_ip!=""}
167 * on (host_ip) group_right (node)
169 (max(node_filesystem_files{job="node-exporter", mountpoint="/"}) by (instance)), "host_ip", "$1", "instance", "(.*):.*"
172 record: 'node:node_inodes_total:'
176 kube_pod_info{job="kube-state-metrics", host_ip!=""}
178 * on (host_ip) group_right (node)
180 (max(node_filesystem_files_free{job="node-exporter", mountpoint="/"}) by (instance)), "host_ip", "$1", "instance", "(.*):.*"
183 record: 'node:node_inodes_free:'