# path: root/kubernetes/namespaces/monitoring/alerts/alerts.d/coredns.yaml
# blob: eeb56ec050f7df411bd136c3ab020f9798e231ca
# Prometheus rule file: a single rule group named `coredns`.
# Each entry under `rules` is an alerting rule (`alert` + `expr`) with an
# optional pending duration (`for`), extra labels and templated annotations.
groups:
- name: coredns
  rules:

  # core-dns/panics
  # Fires when the `coredns_panics_total` counter has increased within the
  # last minute. `for: 0m` means there is no pending period: the alert is
  # raised on the first evaluation where the expression returns a result.
  # `$value` in the description is the computed increase over that window.
  #
  # NOTE(review): `increase()` needs at least two samples inside the range,
  # so the 1m window assumes a scrape interval well under 1m -- confirm
  # against the scrape config for the CoreDNS targets.
  - alert: core-dns/panics
    expr: >-
      increase(coredns_panics_total[1m]) > 0
    for: 0m
    labels:
      severity: page
    annotations:
      summary: 'CoreDNS is experiencing panic'
      description: 'Number of CoreDNS panics encountered: {{ $value }}'

  # core-dns/cache-misses
  # Fires when the average per-second cache-miss rate over the last 2 hours
  # is more than 5x the average rate over the 2 hours before that, and the
  # condition has held for 10 minutes.
  #
  # Why the windows are 2h with a short `for`: the baseline (`offset 2h`)
  # must not overlap the period that is being judged. Comparing two adjacent
  # short windows and then requiring the ratio to stay above 5 for a long
  # `for` would demand that the rate keeps multiplying by 5 every window for
  # the whole pending period, which never happens in practice, so the alert
  # could not fire.
  #
  # `$value` is the ratio itself; `humanizePercentage` renders e.g. 5.5 as
  # "550%".
  #
  # NOTE(review): if the baseline rate is 0 while the current rate is
  # positive, the ratio is +Inf and the alert fires. Add a minimum-traffic
  # guard if low-volume servers make this noisy.
  - alert: core-dns/cache-misses
    expr: >-
      rate(coredns_cache_misses_total[2h])
      / rate(coredns_cache_misses_total[2h] offset 2h)
      > 5
    for: 10m
    labels:
      severity: page
    annotations:
      summary: "High CoreDNS cache misses in last 2 hours"
      description: "This can sometimes be an indication of networking troubles, currently {{ $value | humanizePercentage }} over last 2 hours."