ajout surveillance /var
This commit is contained in:
parent
43e34f8de8
commit
4ef331f6a1
|
@ -34,11 +34,21 @@ groups:
|
|||
- alert: filesystem_threshold_exceeded
|
||||
# Fires when less than 20% of the root filesystem ("/") is still available.
# The mountpoint matcher is repeated on the denominator so the ratio is
# explicitly per-mount instead of relying on label matching alone.
# NOTE(review): %%{job_name_node} looks like a template placeholder that is
# substituted before Prometheus loads this file - confirm.
expr: node_filesystem_avail{job="%%{job_name_node}",mountpoint="/"} / node_filesystem_size{job="%%{job_name_node}",mountpoint="/"}
|
||||
* 100 < 20
|
||||
# The condition must hold for 2 minutes before the alert fires.
for: 2m
|
||||
annotations:
|
||||
# $value is the percentage of space still available, not the usage.
description: Available space on / has dropped below the 20% threshold
|
||||
({{ $value }}% free).
|
||||
summary: Instance {{ $labels.instance }} filesystem usage is dangerously high
|
||||
|
||||
# Heavy "/var" use
|
||||
- alert: var_filesystem_threshold_exceeded
|
||||
# Fires when less than 20% of the "/var" filesystem is still available.
# The mountpoint matcher is repeated on the denominator so the ratio is
# explicitly per-mount instead of relying on label matching alone.
# NOTE(review): job is hard-coded to "node" here, while
# filesystem_threshold_exceeded uses the %%{job_name_node} placeholder -
# confirm which form is intended.
expr: node_filesystem_avail{job="node",mountpoint="/var"} / node_filesystem_size{job="node",mountpoint="/var"}
|
||||
* 100 < 20
|
||||
# Same hold time as filesystem_threshold_exceeded, so a single failing
# evaluation does not fire the alert immediately.
for: 2m
|
||||
annotations:
|
||||
# $value is the percentage of space still available, not the usage.
description: Available space on /var has dropped below the 20% threshold
|
||||
({{ $value }}% free).
|
||||
summary: Instance {{ $labels.instance }} /var filesystem usage is dangerously high
|
||||
|
||||
# High CPU temperature
|
||||
- alert: cpu_temp_threshold_exceeded
|
||||
expr: avg(node_hwmon_temp_celsius{job="node"}) BY (instance)
|
||||
|
|
Loading…
Reference in New Issue