Skip to content

Commit

Permalink
move-shared-alerts-to-phoenix (#1214)
Browse files: browse the repository at this point in the history
  • Loading branch information
QuentinBisson authored Jun 6, 2024
1 parent 5bcefb6 commit 5ad1ff9
Show file tree
Hide file tree
Showing 6 changed files with 19 additions and 23 deletions.
8 changes: 0 additions & 8 deletions helm/prometheus-rules/templates/_helpers.tpl
Original file line number Diff line number Diff line change
Expand Up @@ -53,14 +53,6 @@ true
{{- end -}}
{{- end -}}

{{- define "isClusterServiceInstalled" -}}
{{ not (eq .Values.managementCluster.provider.flavor "capi") }}
{{- end -}}

{{- define "isVaultBeingMonitored" -}}
{{ not (eq .Values.managementCluster.provider.flavor "capi") }}
{{- end -}}

{{- define "isBastionBeingMonitored" -}}
{{ not (eq .Values.managementCluster.provider.flavor "capi") }}
{{- end -}}
Expand Down
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
## TODO Remove with vintage
{{- if eq .Values.managementCluster.provider.flavor "vintage" }}
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
Expand All @@ -21,7 +22,7 @@ spec:
area: kaas
cancel_if_outside_working_hours: {{ include "workingHoursOnly" . }}
severity: notify
team: {{ include "providerTeam" . }}
team: phoenix
topic: kubernetes
- alert: CalicoNodeMemoryHighUtilization
annotations:
Expand All @@ -36,6 +37,6 @@ spec:
area: kaas
cancel_if_outside_working_hours: {{ include "workingHoursOnly" . }}
severity: notify
team: {{ include "providerTeam" . }}
team: phoenix
topic: kubernetes
{{- end }}
Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
{{- if eq (include "isClusterServiceInstalled" .) "true" }}
## TODO Remove with vintage
{{- if eq .Values.managementCluster.provider.flavor "vintage" }}
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
Expand All @@ -23,7 +24,7 @@ spec:
labels:
area: storage
severity: page
team: {{ include "providerTeam" . }}
team: phoenix
topic: managementcluster
{{- if eq .Values.managementCluster.pipeline "testing" }}
- alert: TestClusterTooOld
Expand All @@ -33,5 +34,6 @@ spec:
for: 5m
labels:
severity: notify
team: phoenix
{{- end }}
{{- end }}
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
## TODO Remove with vintage
{{- if eq .Values.managementCluster.provider.flavor "vintage" }}
# newer clusters don't use docker anymore
apiVersion: monitoring.coreos.com/v1
Expand All @@ -22,6 +23,6 @@ spec:
area: kaas
cancel_if_outside_working_hours: "true"
severity: page
team: {{ include "providerTeam" . }}
team: phoenix
topic: observability
{{- end }}
Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
{{- if eq (include "isVaultBeingMonitored" .) "true" }}
## TODO Remove with vintage
{{- if eq .Values.managementCluster.provider.flavor "vintage" }}
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
Expand All @@ -23,7 +24,7 @@ spec:
area: kaas
cancel_if_outside_working_hours: {{ include "workingHoursOnly" . }}
severity: page
team: {{ include "providerTeam" . }}
team: phoenix
topic: vault
- alert: VaultIsSealed
annotations:
Expand All @@ -35,7 +36,7 @@ spec:
area: kaas
cancel_if_outside_working_hours: {{ include "workingHoursOnly" . }}
severity: page
team: {{ include "providerTeam" . }}
team: phoenix
topic: vault
- alert: ClusterServiceVaultTokenAlmostExpired
annotations:
Expand All @@ -47,7 +48,7 @@ spec:
area: kaas
cancel_if_outside_working_hours: "true"
severity: page
team: {{ include "providerTeam" . }}
team: phoenix
topic: vault
- alert: ClusterServiceVaultTokenAlmostExpiredMissing
annotations:
Expand All @@ -60,7 +61,7 @@ spec:
cancel_if_outside_working_hours: {{ include "workingHoursOnly" . }}
cancel_if_prometheus_agent_down: "true"
severity: page
team: {{ include "providerTeam" . }}
team: phoenix
topic: vault
- alert: CertOperatorVaultTokenAlmostExpired
annotations:
Expand All @@ -72,7 +73,7 @@ spec:
area: kaas
cancel_if_outside_working_hours: "true"
severity: page
team: {{ include "providerTeam" . }}
team: phoenix
topic: vault
- alert: CertOperatorVaultTokenAlmostExpiredMissing
annotations:
Expand All @@ -84,7 +85,7 @@ spec:
area: kaas
cancel_if_outside_working_hours: {{ include "workingHoursOnly" . }}
severity: page
team: {{ include "providerTeam" . }}
team: phoenix
topic: vault
- alert: VaultLatestEtcdBackupTooOld
annotations:
Expand All @@ -96,7 +97,7 @@ spec:
area: kaas
cancel_if_outside_working_hours: "true"
severity: page
team: {{ include "providerTeam" . }}
team: phoenix
topic: vault
- alert: VaultLatestEtcdBackupMetricsMissing
annotations:
Expand All @@ -108,7 +109,6 @@ spec:
area: kaas
cancel_if_outside_working_hours: "true"
severity: page
team: {{ include "providerTeam" . }}
team: phoenix
topic: vault

{{- end }}

0 comments on commit 5ad1ff9

Please sign in to comment.