feat(monitoring): regras de alerta Athletic Map

This commit is contained in:
ATM Platform
2026-06-16 21:35:39 +00:00
parent e537ee274d
commit f05867234c
+8 -5
View File
@@ -3,7 +3,8 @@ kind: PrometheusRule
metadata:
name: athleticmap-rules
namespace: monitoring
labels: { release: monitoring }
labels:
release: monitoring
spec:
groups:
- name: athleticmap.backup
@@ -11,14 +12,16 @@ spec:
- alert: AthleticMapBackupStale
expr: time() - kube_cronjob_status_last_successful_time{cronjob="pg-backup"} > 93600
for: 15m
labels: { severity: warning }
labels:
severity: warning
annotations:
summary: "Backup do tenant {{ \.namespace }} sem sucesso ha >26h"
summary: "Backup do tenant {{ $labels.namespace }} sem sucesso ha mais de 26h"
- name: athleticmap.health
rules:
- alert: AthleticMapTenantPodNotReady
expr: kube_pod_status_ready{namespace=~".*-prod", condition="true"} == 0
for: 10m
labels: { severity: warning }
labels:
severity: warning
annotations:
summary: "Pod {{ \.pod }} ({{ \.namespace }}) nao-Ready ha >10m"
summary: "Pod {{ $labels.pod }} em {{ $labels.namespace }} nao-Ready ha mais de 10m"