| Rule |
State |
Error |
Last Evaluation |
Evaluation Time |
| alert: HighCpuUsage
expr: (1
- instance:node_cpu_seconds_total:avg_rate5m{job="node",mode="idle"})
* 100 > 90
for: 5m
labels:
severity: info
annotations:
description: The CPU usage in {{ $labels.instance }} has been over 90% for more
than 5 minutes.
generic_summary: CPU usage too high
summary: CPU usage in {{ $labels.instance }} is too high
|
ok
|
|
15.475s ago
|
457.5us |
| alert: HighLoadAvg
expr: node_load15{job="node"}
> 100
for: 5m
labels:
severity: info
annotations:
description: The 15-minute load average in {{ $labels.instance }} has been over
100 for more than 5 minutes.
generic_summary: Load average too high
summary: The load average in {{ $labels.instance }} is too high
|
ok
|
|
15.475s ago
|
207.6us |
| alert: MemFull
expr: instance:node_memory_MemUsed_bytes_per_node_memory_MemTotal_bytes:ratio{job="node"}
* 100 > 90
for: 15m
labels:
severity: info
annotations:
description: The memory usage in {{ $labels.instance }} has been over 90% for more
than 15 minutes.
generic_summary: Memory usage too high
summary: Memory usage in {{ $labels.instance }} is too high
|
ok
|
|
15.475s ago
|
200us |
| alert: MemFull
expr: instance:node_memory_MemUsed_bytes_per_node_memory_MemTotal_bytes:ratio{job="node"}
* 100 > 95
for: 5m
labels:
severity: warning
annotations:
description: The memory usage in {{ $labels.instance }} has been over 95% for more
than 5 minutes.
generic_summary: Memory usage critical
summary: Memory usage in {{ $labels.instance }} is critical
|
ok
|
|
15.475s ago
|
186.9us |
| alert: FSFull
expr: instance:node_filesystem_avail_bytes_per_node_filesystem_size_bytes:ratio{job="node"}
* 100 <= 1
for: 5m
labels:
severity: warning
annotations:
description: The {{ $labels.mountpoint }} filesystem in {{ $labels.instance }} has
1% or less available space.
generic_summary: Filesystem almost full
summary: Filesystem {{ $labels.mountpoint }} in {{ $labels.instance }} is almost
full
|
ok
|
|
15.475s ago
|
667.7us |
| alert: FSFull
expr: instance:node_filesystem_avail_bytes_per_node_filesystem_size_bytes:ratio{job="node"}
* 100 <= 0.5
for: 5m
labels:
severity: critical
annotations:
description: The {{ $labels.mountpoint }} filesystem in {{ $labels.instance }} is
full.
generic_summary: Filesystem full
summary: Filesystem {{ $labels.mountpoint }} in {{ $labels.instance }} is full
|
ok
|
|
15.474s ago
|
557.1us |
| alert: FSFullSoon
expr: predict_linear(instance:node_filesystem_avail_bytes:sum{job="node"}[12h],
24 * 3600) <= 0
for: 5m
labels:
severity: info
annotations:
description: The {{ $labels.mountpoint }} filesystem in {{ $labels.instance }} will
be full in 24 hours at the current rate.
generic_summary: Filesystem full soon
summary: Filesystem {{ $labels.mountpoint }} in {{ $labels.instance }} will fill
soon
|
ok
|
|
15.474s ago
|
9.728ms |
| alert: FSFullSoon
expr: predict_linear(instance:node_filesystem_avail_bytes:sum{job="node"}[4h],
4 * 3600) <= 0
for: 30m
labels:
severity: warning
annotations:
description: The {{ $labels.mountpoint }} filesystem in {{ $labels.instance }} will
be full in 4 hours at the current rate.
generic_summary: Filesystem full VERY soon
summary: Filesystem {{ $labels.mountpoint }} in {{ $labels.instance }} will fill
VERY soon
|
ok
|
|
15.464s ago
|
3.731ms |
| alert: MemFullSoon
expr: predict_linear(instance:node_memory_MemUsed_bytes_per_node_memory_MemTotal_bytes:ratio{job="node"}[12h],
24 * 3600) * 100 > 99
for: 5m
labels:
severity: info
annotations:
description: The memory usage in {{ $labels.instance }}
will reach 100% in 24 hours at the current rate.
generic_summary: Memory full soon
summary: Memory in {{ $labels.instance }} will fill in 24h
|
ok
|
|
15.46s ago
|
2.743ms |
| alert: MemFullSoon
expr: predict_linear(instance:node_memory_MemUsed_bytes_per_node_memory_MemTotal_bytes:ratio{job="node"}[8h],
4 * 3600) * 100 > 99
for: 30m
labels:
severity: warning
annotations:
description: The memory usage in {{ $labels.instance }}
will reach 100% in 4 hours at the current rate.
generic_summary: Memory full VERY soon
summary: Memory in {{ $labels.instance }} will fill in 4h
|
ok
|
|
15.458s ago
|
1.927ms |
| alert: ProcessNearFDLimits
expr: process_open_fds
/ process_max_fds * 100 > 80
for: 5m
labels:
severity: warning
annotations:
description: The process for {{ $labels.job }} in {{ $labels.instance }} has {{
$value }}% of available file descriptors in use.
generic_summary: Too many files open
summary: The process in {{ $labels.instance }} has too many files open.
|
ok
|
|
15.456s ago
|
499.3us |
|
26.975s ago |
944.4us |
| Rule |
State |
Error |
Last Evaluation |
Evaluation Time |
| record: instance:node_memory_MemTotal_bytes:sum
expr: node_memory_MemTotal_bytes{job="node"}
|
ok
|
|
9.507s ago
|
387us |
| record: instance:node_memory_MemFree_bytes:sum
expr: node_memory_MemFree_bytes{job="node"}
|
ok
|
|
9.506s ago
|
206.5us |
| record: instance:node_memory_MemUsed_bytes:sum
expr: node_memory_MemTotal_bytes{job="node"}
- node_memory_MemFree_bytes{job="node"} - node_memory_Buffers_bytes{job="node"}
- node_memory_Cached_bytes{job="node"}
|
ok
|
|
9.506s ago
|
1.061ms |
| record: instance:node_memory_MemUsed_bytes_per_node_memory_MemTotal_bytes:ratio
expr: instance:node_memory_MemUsed_bytes:sum{job="node"}
/ instance:node_memory_MemTotal_bytes:sum{job="node"}
|
ok
|
|
9.505s ago
|
488.2us |
| record: instance:node_cpu_seconds_total:rate5m
expr: rate(node_cpu_seconds_total{job="node"}[5m])
|
ok
|
|
9.505s ago
|
8.239ms |
| record: instance:node_cpu_seconds_total:avg_rate5m
expr: avg
without (cpu) (rate(node_cpu_seconds_total{job="node"}[5m]))
|
ok
|
|
9.497s ago
|
6.57ms |
| record: instance:node_network_receive_bytes_total:rate5m
expr: rate(node_network_receive_bytes_total{job="node"}[5m])
|
ok
|
|
9.49s ago
|
880.2us |
| record: instance:node_network_receive_drop_total:rate5m
expr: rate(node_network_receive_drop_total{job="node"}[5m])
|
ok
|
|
9.489s ago
|
822.7us |
| record: instance:node_network_receive_errs_total:rate5m
expr: rate(node_network_receive_errs_total{job="node"}[5m])
|
ok
|
|
9.489s ago
|
765.1us |
| record: instance:node_network_receive_packets_total:rate5m
expr: rate(node_network_receive_packets_total{job="node"}[5m])
|
ok
|
|
9.488s ago
|
900.6us |
| record: instance:node_network_transmit_bytes_total:rate5m
expr: rate(node_network_transmit_bytes_total{job="node"}[5m])
|
ok
|
|
9.487s ago
|
878.4us |
| record: instance:node_network_transmit_drop_total:rate5m
expr: rate(node_network_transmit_drop_total{job="node"}[5m])
|
ok
|
|
9.486s ago
|
792.8us |
| record: instance:node_network_transmit_errs_total:rate5m
expr: rate(node_network_transmit_errs_total{job="node"}[5m])
|
ok
|
|
9.485s ago
|
733.7us |
| record: instance:node_network_transmit_packets_total:rate5m
expr: rate(node_network_transmit_packets_total{job="node"}[5m])
|
ok
|
|
9.485s ago
|
815.4us |
| record: instance:node_disk_io_time_seconds_total:rate5m
expr: rate(node_disk_io_time_seconds_total{job="node"}[5m])
|
ok
|
|
9.484s ago
|
1.077ms |
| record: instance:node_disk_read_bytes_total:rate5m
expr: rate(node_disk_read_bytes_total{job="node"}[5m])
|
ok
|
|
9.483s ago
|
923.4us |
| record: instance:node_disk_written_bytes_total:rate5m
expr: rate(node_disk_written_bytes_total{job="node"}[5m])
|
ok
|
|
9.482s ago
|
1.059ms |
| record: instance:node_filesystem_avail_bytes:sum
expr: node_filesystem_avail_bytes{job="node"}
|
ok
|
|
9.481s ago
|
618.1us |
| record: instance:node_filesystem_free_bytes:sum
expr: node_filesystem_free_bytes{job="node"}
|
ok
|
|
9.481s ago
|
568.5us |
| record: instance:node_filesystem_size_bytes:sum
expr: node_filesystem_size_bytes{job="node"}
|
ok
|
|
9.48s ago
|
616.6us |
| record: instance:node_filesystem_avail_bytes_per_node_filesystem_size_bytes:ratio
expr: node_filesystem_avail_bytes{job="node"}
/ node_filesystem_size_bytes{job="node"}
|
ok
|
|
9.48s ago
|
1.037ms |
| record: instance:node_filesystem_free_bytes_per_node_filesystem_size_bytes:ratio
expr: node_filesystem_free_bytes{job="node"}
/ node_filesystem_size_bytes{job="node"}
|
ok
|
|
9.479s ago
|
1.058ms |
| record: instance:node_filesystem_files:sum
expr: node_filesystem_files{job="node"}
|
ok
|
|
9.478s ago
|
537.2us |
| record: instance:node_filesystem_files_free:sum
expr: node_filesystem_files_free{job="node"}
|
ok
|
|
9.477s ago
|
511.4us |
| record: instance:node_filesystem_files_free_per_node_filesystem_files:ratio
expr: node_filesystem_files_free{job="node"}
/ node_filesystem_files{job="node"}
|
ok
|
|
9.477s ago
|
988.2us |