---
# PrometheusRule carrying the kubelet.rules group: three recording rules that
# store the 0.99 / 0.9 / 0.5 quantiles of kubelet_pleg_relist_duration_seconds
# per instance, joined on `instance` with kubelet_node_name to add the `node`
# label.
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  # NOTE(review): creationTimestamp, generation, resourceVersion, selfLink and
  # uid look like server-populated fields from a `kubectl get -oyaml` export;
  # confirm whether they should be stripped before this manifest is re-applied.
  creationTimestamp: "2020-07-20T11:06:19Z"
  generation: 1
  labels:
    app: prometheus-operator
    chart: prometheus-operator-8.13.2
    heritage: Tiller
    release: prometheus
  name: prometheus-prometheus-oper-kubelet.rules
  namespace: monitoring
  # Quoted so the all-digit value stays a string.
  resourceVersion: "306713214"
  selfLink: /apis/monitoring.coreos.com/v1/namespaces/monitoring/prometheusrules/prometheus-prometheus-oper-kubelet.rules
  uid: f45f0116-a73d-4a30-96cc-8bd7dd0fa7d5
spec:
  groups:
    - name: kubelet.rules
      rules:
        # The folded scalars (>-) join their lines with single spaces, so each
        # expression reaches Prometheus as one line.
        - expr: >-
            histogram_quantile(0.99,
            sum(rate(kubelet_pleg_relist_duration_seconds_bucket[5m]))
            by (instance, le) * on(instance) group_left(node)
            kubelet_node_name{job="kubelet", metrics_path="/metrics"})
          labels:
            # Label values must be strings; unquoted 0.99 would parse as a float.
            quantile: "0.99"
          record: node_quantile:kubelet_pleg_relist_duration_seconds:histogram_quantile
        - expr: >-
            histogram_quantile(0.9,
            sum(rate(kubelet_pleg_relist_duration_seconds_bucket[5m]))
            by (instance, le) * on(instance) group_left(node)
            kubelet_node_name{job="kubelet", metrics_path="/metrics"})
          labels:
            quantile: "0.9"
          record: node_quantile:kubelet_pleg_relist_duration_seconds:histogram_quantile
        - expr: >-
            histogram_quantile(0.5,
            sum(rate(kubelet_pleg_relist_duration_seconds_bucket[5m]))
            by (instance, le) * on(instance) group_left(node)
            kubelet_node_name{job="kubelet", metrics_path="/metrics"})
          labels:
            quantile: "0.5"
          record: node_quantile:kubelet_pleg_relist_duration_seconds:histogram_quantile
- expr: histogram_quantile(0.99, sum(rate(kubelet_pleg_relist_duration_seconds_bucket[5m]))
irate(demo_server_data_gauge{instance="10.233.99.128:9001",host="cpu Usage(%)"}[5m])
---
# PrometheusRule with a single alerting rule in the basedata.rules group: it
# fires with severity=warning once the expression below has held for 2 minutes.
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  labels:
    prometheus: k8s
    role: alert-rules
    app: prometheus-operator
    chart: prometheus-operator-8.13.2
    heritage: Tiller
    release: prometheus
  name: prometheus-prometheus-oper-basedata.rules
  namespace: kubesphere-monitoring-system
spec:
  groups:
    - name: basedata.rules
      rules:
        # A rule needs exactly one of `alert` or `record`; `for` is only valid
        # on alerting rules, so this one is named as an alert.
        - alert: cpuUsageUnavailable
          # NOTE(review): the metric name suggests a gauge, while irate() is
          # meant for counters — confirm this is the intended function.
          # NOTE(review): the selector pins one hard-coded instance address;
          # confirm that address is stable.
          expr: |
            irate(demo_server_data_gauge{instance="10.233.99.127:9001",host="cpu Usage(%)"}[5m]) > 0.81
          for: 2m
          labels:
            severity: warning
998 vim /etc/alternatives/
999 ls
1000 kubectl get prometheus -n kubesphere-monitoring-system k8s-system -oyaml
1001 ls
1002 cd k8s/pod/prometheusRule/
1003 ls
1004 vim promtheusRule.yaml
1005 cat promtheusRule.yaml
1006 kubectl apply -f promtheusRule.yaml
1007 kubectl get svc -n kubesphere-monitoring-system
1008 kubectl get prometheus -n kubesphere-monitoring-system k8s-system -oyaml
1009 kubectl get pod -n kubesphere-monitoring-system
1010 kubectl get prometheus -n kubesphere-monitoring-system
1011 ls
1012 cat promtheusRule.yaml
irate(demo_server_data_gauge{host="disk Usage(%)",instance="10.233.99.129:9001"}[60m])
kubectl edit PrometheusRule -n kubesphere-monitoring-system prometheus-k8s-rules
kubectl -n kubesphere-monitoring-system get prometheusrules prometheus-k8s-rules -oyaml
kubectl delete PrometheusRule prometheus-prometheus-oper-basedata.rules
kubectl delete -f promtheusRule.yaml
kubectl -n kubesphere-monitoring-system get prometheusrules prometheus-k8s-rules -oyaml
kubectl get PrometheusRule -n kubesphere-monitoring-system
kubectl edit PrometheusRule -n kubesphere-monitoring-system prometheus-k8s-rules
kubectl -n kubesphere-monitoring-system get prometheusrules prometheus-k8s-rules -oyaml
---
# PrometheusRule for the basedata.rules group. For each of four
# demo_server_data_gauge series (cpu, disk, mem, bytes sent) it defines:
#   - a recording rule that stores the raw irate() value, and
#   - an alerting rule (severity=warning) that fires once the value has stayed
#     above its threshold for 2 minutes.
# A single rule may set `alert` or `record`, never both, so each pair is written
# as two separate rules.
#
# NOTE(review): the metric name suggests a gauge, while irate() is meant for
# counters — confirm this is the intended function.
# NOTE(review): every selector pins one hard-coded instance address; confirm
# that address is stable.
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  name: prometheus-prometheus-oper-basedata.rules
  namespace: kubesphere-monitoring-system
  labels:
    prometheus: k8s
    role: alert-rules
    app: prometheus-operator
    chart: prometheus-operator-8.13.2
    heritage: Tiller
    release: prometheus-operator
spec:
  groups:
    - name: basedata.rules
      rules:
        # --- cpu ---
        - record: cpuUsage:demo_server_data_gauge:irate
          expr: |
            irate(demo_server_data_gauge{instance="10.233.99.128:9001",host="cpu Usage(%)"}[5m])
        - alert: cpuUsageUnavailable
          annotations:
            description: my cpu goes down the cluster will be unavailable
          expr: |
            irate(demo_server_data_gauge{instance="10.233.99.128:9001",host="cpu Usage(%)"}[5m]) > 0.8
          for: 2m
          labels:
            severity: warning
        # --- disk ---
        - record: diskUsage:demo_server_data_gauge:irate
          expr: |
            irate(demo_server_data_gauge{instance="10.233.99.128:9001",host="disk Usage(%)"}[5m])
        - alert: diskUsageUnavailable
          annotations:
            description: my disk goes down the cluster will be unavailable
          expr: |
            irate(demo_server_data_gauge{instance="10.233.99.128:9001",host="disk Usage(%)"}[5m]) > 0.8
          for: 2m
          labels:
            severity: warning
        # --- mem ---
        - record: memUsage:demo_server_data_gauge:irate
          expr: |
            irate(demo_server_data_gauge{instance="10.233.99.128:9001",host="mem Usage(%)"}[5m])
        - alert: memUsageUnavailable
          annotations:
            # Previously said "cpu" (copy-paste from the cpu alert).
            description: my mem goes down the cluster will be unavailable
          expr: |
            irate(demo_server_data_gauge{instance="10.233.99.128:9001",host="mem Usage(%)"}[5m]) > 0.8
          for: 2m
          labels:
            severity: warning
        # --- bytes sent ---
        - record: bytesSent:demo_server_data_gauge:irate
          expr: |
            irate(demo_server_data_gauge{instance="10.233.99.128:9001",host="bytes Sent"}[5m])
        - alert: bytesSentUnavailable
          annotations:
            # Previously said "cpu" (copy-paste from the cpu alert).
            description: my bytes sent goes down the cluster will be unavailable
          expr: |
            irate(demo_server_data_gauge{instance="10.233.99.128:9001",host="bytes Sent"}[5m]) > 80
          for: 2m
          labels:
            severity: warning