feat: add postgres/gitea/blackbox alerts and more node alerts
This commit is contained in:
19
environments/dev/adibrov/alerts/node/node_high_load.yaml
Normal file
19
environments/dev/adibrov/alerts/node/node_high_load.yaml
Normal file
@ -0,0 +1,19 @@
|
||||
# Alert rule: 5-minute load average per CPU core on hosts scraped by
# node_exporter.
name: "DEV ADIBROV - High System Load"
# Load per core. The core count is taken from node_exporter's own per-CPU
# idle series, so both sides of the division come from the same job and
# carry the same `instance` label. Joining against a series from another
# exporter on `instance` matches nothing when the two targets are scraped
# on different host:port addresses, and with no_data_state "OK" below the
# rule would then silently never fire.
expression: |
  node_load5{job="node_exporter"}
    / on(instance)
  count by (instance) (node_cpu_seconds_total{job="node_exporter", mode="idle"})
# Fire when load per core stays above 2 for 10 minutes. Keep the threshold
# in sync with the "2x" wording in `description`.
threshold: 2
for: "10m"
condition_type: "gt"
# NOTE(review): presumably adds a reduce step (max over the query window)
# whose result is what `$values.B` in `summary` refers to - confirm against
# the module that consumes this file.
need_reduce: true
reducer_type: "max"
# NOTE(review): an empty query result is reported as OK, so a broken
# expression or a missing exporter will not raise this alert - confirm
# that this is intended.
no_data_state: "OK"
exec_err_state: "Error"
labels:
  service: "system"
  severity: "warning"
  team: "infra"
summary: |
  Высокий LA на {{ $labels.instance }}: {{ printf "%.2f" $values.B.Value }} на ядро
description: |
  Средняя нагрузка (load average 5m) на {{ $labels.instance }} превышает 2x количество ядер CPU.
  Система перегружена — процессы ждут в очереди на выполнение.
|
||||
Reference in New Issue
Block a user