Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion chart/infra-server/Chart.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -15,5 +15,5 @@ dependencies:
version: "0.45.9"
repository: "https://argoproj.github.io/argo-helm"
- name: kube-prometheus
version: 11.1.1
version: 11.3.10
repository: https://charts.bitnami.com/bitnami
6 changes: 6 additions & 0 deletions chart/infra-server/monitoring-values.yaml
Original file line number Diff line number Diff line change
@@ -1,6 +1,8 @@
kube-prometheus:
namespaceOverride: monitoring
operator:
image:
repository: bitnamilegacy/prometheus-operator
resources:
limits:
cpu: 100m
Expand All @@ -14,6 +16,8 @@ kube-prometheus:
enabled: false

prometheus:
image:
repository: bitnamilegacy/prometheus
persistence:
enabled: true
resources:
Expand Down Expand Up @@ -45,6 +49,8 @@ kube-prometheus:
enabled: false

alertmanager:
image:
repository: bitnamilegacy/alertmanager
resources:
limits:
cpu: 100m
Expand Down
6 changes: 3 additions & 3 deletions chart/infra-server/requirements.lock
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,6 @@ dependencies:
version: 0.45.9
- name: kube-prometheus
repository: https://charts.bitnami.com/bitnami
version: 11.1.1
digest: sha256:46322f064751933585c0985dad77996ed8ee216df0fed19ea9c40f7935f67ae7
generated: "2025-03-05T10:30:52.962223+01:00"
version: 11.3.10
digest: sha256:59c5c412a14a5ce69cdc7745be5d37603ee0e7748608a586a2b812da4457e60a
generated: "2025-10-01T13:00:11.143106+02:00"
7 changes: 7 additions & 0 deletions chart/infra-server/templates/monitoring/alertmanager.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,8 +11,15 @@ spec:
route:
receiver: 'slack-notifications'
groupBy: [alertname, job, app]
routes:
- matchers:
- name: alertname
value: InfoInhibitor
receiver: 'null'
continue: false

receivers:
- name: 'null'
- name: 'slack-notifications'
slackConfigs:
- apiURL:
Expand Down
4 changes: 2 additions & 2 deletions chart/infra-server/templates/monitoring/rules.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@ spec:
interval: 30s
rules:
- alert: Workflow Error
expr: increase(argo_workflows_count{status="Error"}[5m]) > 0
expr: increase(argo_workflows_gauge{status="Error"}[5m]) > 0
for: 1m
annotations:
summary: A workflow has errored
Expand All @@ -20,7 +20,7 @@ spec:
namespace: monitoring
environment: {{ .Values.environment }}
- alert: Workflow Failure
expr: increase(argo_workflows_count{status="Failed"}[5m]) > 0
expr: increase(argo_workflows_gauge{status="Failed"}[5m]) > 0
for: 1m
annotations:
summary: A workflow has failed.
Expand Down
Loading