---
# Prometheus alerting rules for basic Linux host resources.
# The metric names used below (node_filesystem_*, node_memory_*,
# node_cpu_seconds_total) are the ones exposed by node_exporter.
# Every rule must hold continuously for 20 minutes before it fires.
groups:
  - name: node.rules
    rules:
      # Filesystem usage: 100 - free/size*100, restricted to xfs and ext4
      # filesystems. Fires when a filesystem is more than 80% used.
      - alert: NodeDiskUsage
        expr: >-
          100 - (
          node_filesystem_free_bytes{fstype=~"xfs|ext4"}
          / node_filesystem_size_bytes{fstype=~"xfs|ext4"} * 100
          ) > 80
        for: 20m
        labels:
          severity: warning
        annotations:
          # The filesystem label is spelled "mountpoint"; the previous
          # "mounpoint" spelling rendered as an empty string.
          summary: "Instance {{ $labels.instance }} : {{ $labels.mountpoint }} 分区使用率过高"
          description: "{{ $labels.instance }} {{ $labels.mountpoint }} 分区使用大于80% (当前值: {{ $value }})"

      # Memory usage: free + page cache + buffers are counted as available.
      # Fires when the remaining share of MemTotal exceeds 80%.
      - alert: NodeMemoryUsage
        expr: >-
          100 - (
          (node_memory_MemFree_bytes
          + node_memory_Cached_bytes
          + node_memory_Buffers_bytes)
          / node_memory_MemTotal_bytes * 100
          ) > 80
        for: 20m
        labels:
          severity: warning
        annotations:
          summary: "Instance {{ $labels.instance }} : 内存使用率过高"
          description: "{{ $labels.instance }} 内存使用大于80% (当前值: {{ $value }})"

      # CPU usage: 100 minus the per-instance average idle percentage.
      # rate() over 5m is used instead of irate() over 1m: irate() only
      # looks at the last two samples, so a momentary dip can reset the
      # "for" timer, and a 1m window may hold fewer than two samples.
      # NOTE(review): confirm 5m suits the configured scrape interval.
      - alert: NodeCpuUsage
        expr: >-
          100 - (
          avg by (instance) (rate(node_cpu_seconds_total{mode="idle"}[5m]))
          * 100
          ) > 60
        for: 20m
        labels:
          severity: warning
        annotations:
          summary: "Instance {{ $labels.instance }} : CPU使用率过高"
          description: "{{ $labels.instance }} CPU使用大于60% (当前值: {{ $value }})"
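# Source article title: "Alertmanager alerting rules: Linux basic resources" (Alertmanager告警规则之—Linux基础资源)
# Source page note: latest recommended article published on 2024-02-04 10:26:29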