1、监控网站延迟规则
[root@master ~]# cat web-rule.yaml
# PrometheusRule (Prometheus Operator CRD) defining one alert on slow HTTP
# probes, based on the probe_http_duration_seconds metric.
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  labels:
    app.kubernetes.io/component: exporter
    app.kubernetes.io/name: blackbox-exporter
    # NOTE(review): presumably these two labels are what the Prometheus
    # resource's ruleSelector matches on; confirm against the cluster.
    prometheus: k8s
    role: alert-rules
  name: blackbox
  namespace: kuboard
spec:
  groups:
    - name: blackbox-exporter
      rules:
        - alert: DomainAccessDelayExceeds1s
          annotations:
            description: '域名 {{ $labels.instance }} 检测延迟大于1秒, 当前值为 {{ $value }}'
            summary: '域名探测,访问延迟超过1秒'
          # Adds up every probe_http_duration_seconds series of the
          # "blackbox" job per instance and compares the total to 1 second.
          expr: 'sum(probe_http_duration_seconds{job=~"blackbox"}) by (instance) > 1'
          # The condition must hold for a full minute before the alert fires.
          for: 1m
          labels:
            # Was misspelled "warring"; NOTE(review): if any Alertmanager
            # route matches on the old spelling, update it as well.
            severity: warning
            type: blackbox
说明:以上配置表示当网站延迟大于1秒并持续1分钟时就告警
2、监控MySql服务是否正常规则
[root@master ~]# cat mysql-rule.yaml
# PrometheusRule (Prometheus Operator CRD) defining one alert that fires
# when the mysql_up metric reports 0.
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  labels:
    app.kubernetes.io/component: exporter
    app.kubernetes.io/name: mysql-exporter
    # NOTE(review): presumably these two labels are what the Prometheus
    # resource's ruleSelector matches on; confirm against the cluster.
    prometheus: k8s
    role: alert-rules
  name: mysql
  namespace: kuboard
spec:
  groups:
    - name: mysql-exporter
      rules:
        - alert: MySqlDown
          annotations:
            description: 'mysql {{ $labels.instance }} 挂了'
            summary: 'mysql无法访问'
          # PromQL equality is "=="; a single "=" is not a valid comparison
          # operator and makes the rule fail to parse.
          expr: 'mysql_up == 0'
          # The condition must hold for a full minute before the alert fires.
          for: 1m
          labels:
            # Was misspelled "warring"; NOTE(review): if any Alertmanager
            # route matches on the old spelling, update it as well.
            severity: warning
            type: database
说明:当 mysql_up 的值为 0 时,说明mysql服务挂了,需要及时处理