- 1分钟内文件没有恢复告警
root@monitor-alarm:/usr/local/prometheus/prometheus# cat alert.rules.yml
groups:
- name: alert.rules
rules:
- alert: cpu_usage_over_threshold
# CPU busy percentage per `alarmhost` label: 100 minus the average 1m irate of
# idle CPU time scaled to percent; the condition matches when it exceeds 90.
# Kept on one quoted line so the selector braces are never split across lines.
expr: '100 - (avg by (alarmhost) (irate(node_cpu_seconds_total{mode="idle"}[1m])) * 100) > 90'
# Alarm duration: how long the expression above must keep matching before the
# alert is raised (Prometheus `for` clause) — here 60 seconds.
for: 60s
# Labels attached to alerts raised by this rule. The rule schema names this
# field `labels` (plural); severity is quoted so it is always read as a string.
labels:
  severity: "critical"
annotatio