From efb9fa9194ff5f70fe027b945787cbc34293db05 Mon Sep 17 00:00:00 2001
From: Johannes Christ
Date: Mon, 26 Aug 2024 17:49:22 +0200
Subject: Install prometheus-postfix-exporter

As a data-obsessed administrator I want to have more data such that I
can widen my sense of power.

This also installs rsyslog, because prometheus-postfix-exporter doesn't
work with journald's binary log format.
---
Review notes (text between the "---" line above and the first
"diff --git" line is not part of the change and is skipped on apply):

  * Creates alerts.d/mail.yaml with one rule group, "postfix", holding
    two alerts that both carry the label severity=warning:
      postfix/down
          Fires when "postfix_up != 1" has held for 5m.
      postfix/smtp-temporary-errors
          Fires when the 15m rate of
          postfix_smtpd_messages_rejected_total, restricted to series
          whose "code" label matches "^4.*", is above 0. "for: 0m"
          means there is no hold period before the alert fires.
  * Both summaries interpolate {{ $labels.instance }}; the second
    alert's description also interpolates {{ $labels.code }}.
  * The "description" value is a multi-line plain scalar: YAML folds
    its continuation lines into one space-separated line.
  * NOTE(review): the leading "^" in code=~"^4.*" looks redundant,
    since Prometheus regex matchers are documented as fully anchored.
    Confirm before simplifying; it is left untouched here.

 .../monitoring/alerts/alerts.d/mail.yaml | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)
 create mode 100644 kubernetes/namespaces/monitoring/alerts/alerts.d/mail.yaml

(limited to 'kubernetes/namespaces')

diff --git a/kubernetes/namespaces/monitoring/alerts/alerts.d/mail.yaml b/kubernetes/namespaces/monitoring/alerts/alerts.d/mail.yaml
new file mode 100644
index 0000000..39f6a3e
--- /dev/null
+++ b/kubernetes/namespaces/monitoring/alerts/alerts.d/mail.yaml
@@ -0,0 +1,22 @@
+groups:
+  - name: postfix
+    rules:
+      - alert: postfix/down
+        expr: postfix_up != 1
+        for: 5m
+        labels:
+          severity: warning
+        annotations:
+          summary: Postfix is down (instance {{ $labels.instance }})
+      - alert: postfix/smtp-temporary-errors
+        expr: rate(postfix_smtpd_messages_rejected_total{code=~"^4.*"}[15m]) > 0
+        for: 0m
+        labels:
+          severity: warning
+        annotations:
+          summary: Postfix is rejecting messages due to errors (instance {{ $labels.instance }})
+          description: Postfix has seen code {{ $labels.code }} errors recently
+            and temporarily rejected emails.
+            https://en.wikipedia.org/wiki/List_of_SMTP_server_return_codes and
+            `sudo journalctl -xeu postfix@-` may provide more information on
+            the current issue.
-- 
cgit v1.2.3