aboutsummaryrefslogtreecommitdiffstats
path: root/kubernetes/namespaces/monitoring/alerts/alerts.d/jobs.yaml
blob: fd163376e2b6ca6962284105cc45ccc7294795d0 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
# Alert rules covering Kubernetes Job / CronJob state (group "jobs").
groups:
- name: jobs
  rules:
  # Raised for every series where kube_cronjob_spec_suspend is non-zero.
  # `for: 0m` means there is no pending period: the alert fires on the
  # first evaluation in which the expression matches.
  - alert: kubernetes/cronjob-suspended
    expr: kube_cronjob_spec_suspend != 0
    for: 0m
    labels:
      severity: page
    annotations:
      summary: 'Kubernetes CronJob suspended: {{ $labels.cronjob }}'
      # Folded scalar (>-): the two lines below are joined with a single
      # space and no trailing newline is kept.
      description: >-
        CronJob {{ $labels.kubernetes_namespace }}/{{ $labels.cronjob }}
        is suspended

  # Raised for every series where kube_job_status_failed is above zero.
  # `for: 0m` means there is no pending period: the alert fires on the
  # first evaluation in which the expression matches.
  - alert: kubernetes/jobs-failed
    expr: kube_job_status_failed > 0
    for: 0m
    labels:
      severity: page
    annotations:
      summary: 'Kubernetes Job failed: {{ $labels.job_name }}'
      # The namespace label was previously misspelled as
      # "kubernetes_namespacenamespace", which matches no label and left the
      # namespace part of the message blank. It now uses the same
      # "kubernetes_namespace" label as the cronjob-suspended rule.
      # NOTE(review): kube-state-metrics exposes the object's namespace as
      # "namespace" by default; confirm "kubernetes_namespace" is what the
      # scrape relabeling actually attaches to these series.
      # Folded scalar (>-): the two lines below are joined with a single
      # space and no trailing newline is kept.
      description: >-
        Job {{$labels.kubernetes_namespace}}/{{$labels.job_name}}
        failed to complete