Compare commits

..

1 Commit

Author SHA1 Message Date
Laurent Gourvenec 45c97c765b augmentation du seuil d'alerte température CPU 2024-05-30 11:44:13 +02:00
1 changed file with 1 addition and 11 deletions

View File

@@ -34,25 +34,15 @@ groups:
- alert: filesystem_threshold_exceeded
  # Percentage of space still available on "/"; the rule matches when that
  # percentage is below 20.
  expr: >-
    node_filesystem_avail{job="%%{job_name_node}",mountpoint="/"}
    / node_filesystem_size{job="%%{job_name_node}"}
    * 100 < 20
  # The condition has to hold for 2 minutes before the alert fires.
  for: 2m
  annotations:
    summary: 'Instance {{ $labels.instance }} filesystem usage is dangerously high'
    # NOTE(review): per expr, $value is the percentage still available,
    # although the text below calls it "usage" - confirm the wording.
    description: >-
      This device's filesystem usage has exceeded the threshold
      with a value of {{ $value }}.
# Low free space on "/var": matches when less than 20 percent of the
# filesystem is still available.
- alert: var_filesystem_threshold_exceeded
  # NOTE(review): job is hard-coded to "node" here, while the "/" rule uses
  # the job_name_node placeholder - confirm both select the same job.
  expr: >-
    node_filesystem_avail{job="node",mountpoint="/var"}
    / node_filesystem_size{job="node"}
    * 100 < 20
  # NOTE(review): no "for:" clause, unlike the "/" rule (for: 2m), so this
  # rule fires as soon as the expression matches - confirm that is intended.
  annotations:
    summary: 'Instance {{ $labels.instance }} filesystem usage is dangerously high'
    description: >-
      This device's filesystem usage has exceeded the threshold
      with a value of {{ $value }}.
# High CPU temperature: matches when the per-instance average of
# node_hwmon_temp_celsius is above 70.
- alert: cpu_temp_threshold_exceeded
  # Single threshold only: the former "> 50" comparison was superseded by
  # "> 70" when the alert threshold was raised, so it is not repeated here.
  expr: avg(node_hwmon_temp_celsius{job="node"}) BY (instance) > 70
  annotations:
    # $value is the averaged temperature that matched the expression.
    description: >-
      This device's cpu temperature has exceeded the threshold with a value
      of {{ $value }}.