From 49f08e26f12309d5eb5a59ceffef850b52feac7d Mon Sep 17 00:00:00 2001 From: icecheng Date: Wed, 24 Sep 2025 17:18:18 +0800 Subject: [PATCH 1/2] update alertmanager config --- altermanager/alertmanager-config.yaml | 15 ++++++++++----- 1 file changed, 10 insertions(+), 5 deletions(-) diff --git a/altermanager/alertmanager-config.yaml b/altermanager/alertmanager-config.yaml index 3d712acb..f37df70c 100644 --- a/altermanager/alertmanager-config.yaml +++ b/altermanager/alertmanager-config.yaml @@ -37,16 +37,21 @@ spec: sendResolved: true headers: - key: Subject - value: '🚨Freeleaps Alert: {{ .CommonAnnotations.summary }}' + value: '{{ if eq .Status "firing" }}🚨 Freeleaps Alert: {{ .CommonAnnotations.summary }}{{ else }}✅ Freeleaps Resolved: {{ .CommonAnnotations.summary }}{{ end }}' html: |- +

{{ if eq .Status "firing" }}🚨 Alert: {{ .CommonAnnotations.summary }}{{ else }}✅ Resolved: {{ .CommonAnnotations.summary }}{{ end }}

+

πŸ“ AlertName: {{ .CommonLabels.alertname }}

+

🔧 Service: {{ .CommonLabels.service }}

+

🔧 Pod: {{ .CommonLabels.pod }}({{ .CommonLabels.instance }})

+

🏷️ Severity: {{ .CommonLabels.severity }}

+

{{ if eq .Status "firing" }}🔴 Status:{{ else }}🟢 Status:{{ end }} {{ .Status | toUpper }}

πŸ“ Description: {{ .CommonAnnotations.description }}

-

{{ if eq .Status "firing" }}🔴 Status: {{ .Status | toUpper }}{{ else }}🟢 Status: {{ .Status | toUpper }}{{ end }}

📖 Runbook: {{ .CommonAnnotations.runbook_url }}

name: email route: groupBy: - severity - groupInterval: 30s + groupInterval: 5m receiver: email - groupWait: 30s - repeatInterval: 1m + groupWait: 5m + repeatInterval: 6h From 07a0af3a357049560941db842e48abd6e6d3a34c Mon Sep 17 00:00:00 2001 From: icecheng Date: Wed, 24 Sep 2025 18:24:21 +0800 Subject: [PATCH 2/2] feat: add namespace in metrics alert --- altermanager/alertmanager-config.yaml | 4 ++-- freeleaps/helm-pkg/metrics/values.prod.yaml | 4 ++-- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/altermanager/alertmanager-config.yaml b/altermanager/alertmanager-config.yaml index f37df70c..8064fc95 100644 --- a/altermanager/alertmanager-config.yaml +++ b/altermanager/alertmanager-config.yaml @@ -3,7 +3,7 @@ kind: Secret type: Opaque metadata: name: altermanager-email-credentials - namespace: freeleaps-monitoring-system + namespace: freeleaps-prod data: password: cHducGNya3d0aXp5Z2RoZQ== --- @@ -11,7 +11,7 @@ apiVersion: monitoring.coreos.com/v1alpha1 kind: AlertmanagerConfig metadata: name: alertmanager-config - namespace: freeleaps-monitoring-system + namespace: freeleaps-prod spec: receivers: # - msteamsConfigs: diff --git a/freeleaps/helm-pkg/metrics/values.prod.yaml b/freeleaps/helm-pkg/metrics/values.prod.yaml index 7327084e..b1f6f443 100644 --- a/freeleaps/helm-pkg/metrics/values.prod.yaml +++ b/freeleaps/helm-pkg/metrics/values.prod.yaml @@ -94,7 +94,7 @@ metrics: labels: severity: critical service: metrics-service - namespace: freeleaps-monitoring-system + namespace: freeleaps-prod annotations: summary: Freeleaps Metrics service is down (instance {{ $labels.instance }}) description: Freeleaps Metrics service has been down for more than 1 minutes. 
@@ -105,7 +105,7 @@ metrics: labels: severity: warning service: metrics-service - namespace: freeleaps-monitoring-system + namespace: freeleaps-prod annotations: summary: High error rate in freeleaps metrics service (instance {{ $labels.instance }}) description: Freeleaps Metrics service error rate is {{ $value }} errors per second.