diff options
Diffstat (limited to 'kubernetes')
| -rw-r--r-- | kubernetes/namespaces/monitoring/alerts/alerts.d/mail.yaml | 22 | 
1 files changed, 22 insertions, 0 deletions
| diff --git a/kubernetes/namespaces/monitoring/alerts/alerts.d/mail.yaml b/kubernetes/namespaces/monitoring/alerts/alerts.d/mail.yaml new file mode 100644 index 0000000..39f6a3e --- /dev/null +++ b/kubernetes/namespaces/monitoring/alerts/alerts.d/mail.yaml @@ -0,0 +1,22 @@ +groups: +  - name: postfix +    rules: +      - alert: postfix/down +        expr: postfix_up != 1 +        for: 5m +        labels: +          severity: warning +        annotations: +          summary: Postfix is down (instance {{ $labels.instance }}) +      - alert: postfix/smtp-temporary-errors +        expr: rate(postfix_smtpd_messages_rejected_total{code=~"^4.*"}[15m]) > 0 +        for: 0m +        labels: +          severity: warning +        annotations: +          summary: Postfix is rejecting messages due to errors (instance {{ $labels.instance }}) +          description: Postfix has seen code {{ $labels.code }} errors recently +            and temporarily rejected emails. +            https://en.wikipedia.org/wiki/List_of_SMTP_server_return_codes and +            `sudo journalctl -xeu postfix@-` may provide more information on +            the current issue. | 
