feat(monitoring): regras de alerta Athletic Map
This commit is contained in:
@@ -3,7 +3,8 @@ kind: PrometheusRule
|
||||
metadata:
|
||||
name: athleticmap-rules
|
||||
namespace: monitoring
|
||||
labels: { release: monitoring }
|
||||
labels:
|
||||
release: monitoring
|
||||
spec:
|
||||
groups:
|
||||
- name: athleticmap.backup
|
||||
@@ -11,14 +12,16 @@ spec:
|
||||
- alert: AthleticMapBackupStale
|
||||
expr: time() - kube_cronjob_status_last_successful_time{cronjob="pg-backup"} > 93600
|
||||
for: 15m
|
||||
labels: { severity: warning }
|
||||
labels:
|
||||
severity: warning
|
||||
annotations:
|
||||
summary: "Backup do tenant {{ \.namespace }} sem sucesso ha >26h"
|
||||
summary: "Backup do tenant {{ $labels.namespace }} sem sucesso ha mais de 26h"
|
||||
- name: athleticmap.health
|
||||
rules:
|
||||
- alert: AthleticMapTenantPodNotReady
|
||||
expr: kube_pod_status_ready{namespace=~".*-prod", condition="true"} == 0
|
||||
for: 10m
|
||||
labels: { severity: warning }
|
||||
labels:
|
||||
severity: warning
|
||||
annotations:
|
||||
summary: "Pod {{ \.pod }} ({{ \.namespace }}) nao-Ready ha >10m"
|
||||
summary: "Pod {{ $labels.pod }} em {{ $labels.namespace }} nao-Ready ha mais de 10m"
|
||||
|
||||
Reference in New Issue
Block a user