feat: add postgres/gitea/blackbox alerts and more node alerts
This commit is contained in:
21
environments/dev/adibrov/alerts/node/node_high_cpu.yaml
Normal file
21
environments/dev/adibrov/alerts/node/node_high_cpu.yaml
Normal file
@ -0,0 +1,21 @@
|
||||
# Alert rule: sustained high CPU usage on a host (dev / adibrov environment).
name: 'DEV ADIBROV - High CPU Usage'

# Query: percentage of non-idle CPU time per instance, computed as 1 minus the
# per-instance average of the 5-minute rate of idle CPU seconds, scaled by 100.
expression: |
  (
    1 - avg by(instance) (rate(node_cpu_seconds_total{job="node_exporter", mode="idle"}[5m]))
  ) * 100

# Firing condition: value "gt" 85, held for 5 minutes (the description text
# below states the same 85% / 5 minute figures, so keep them in sync).
threshold: 85
condition_type: 'gt'
for: '5m'

# Presumably the query result is reduced with "max" before the threshold
# comparison - TODO confirm against the tool that consumes this file.
need_reduce: true
reducer_type: 'max'

# NOTE(review): with no_data_state set to OK, a missing node_exporter series
# presumably will not raise this alert - confirm that is intended.
no_data_state: 'OK'
exec_err_state: 'Error'

labels:
  service: 'system'
  severity: 'warning'
  team: 'infra'

# Summary text (Russian): "High CPU load: <value>% on <instance>".
# $values.B.Value presumably refers to the reduced value - verify the ref ID.
summary: |
  Высокая нагрузка CPU: {{ printf "%.0f" $values.B.Value }}% на {{ $labels.instance }}

# Description text (Russian): CPU usage on the instance has exceeded 85% for
# 5 minutes; this may degrade performance of all services on the host.
description: |
  Использование CPU на {{ $labels.instance }} превышает 85% на протяжении 5 минут.
  Это может привести к деградации производительности всех сервисов на хосте.
|
||||
Reference in New Issue
Block a user