Skip to content

Commit 7626525

Browse files
committed
Ref #32619: update kube-prometheus
1 parent 0e97477 commit 7626525

File tree

94 files changed

+24404
-19647
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

94 files changed

+24404
-19647
lines changed

bases/monitoring/kustomization.yaml

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -7,11 +7,14 @@ resources:
77
- manifests/setup/0podmonitorCustomResourceDefinition.yaml
88
- manifests/setup/0probeCustomResourceDefinition.yaml
99
- manifests/setup/0prometheusCustomResourceDefinition.yaml
10+
- manifests/setup/0prometheusagentCustomResourceDefinition.yaml
1011
- manifests/setup/0prometheusruleCustomResourceDefinition.yaml
12+
- manifests/setup/0scrapeconfigCustomResourceDefinition.yaml
1113
- manifests/setup/0servicemonitorCustomResourceDefinition.yaml
1214
- manifests/setup/0thanosrulerCustomResourceDefinition.yaml
1315
- manifests/setup/namespace.yaml
1416
- manifests/alertmanager-alertmanager.yaml
17+
- manifests/alertmanager-networkPolicy.yaml
1518
- manifests/alertmanager-podDisruptionBudget.yaml
1619
- manifests/alertmanager-prometheusRule.yaml
1720
- manifests/alertmanager-secret.yaml
@@ -22,6 +25,7 @@ resources:
2225
- manifests/blackboxExporter-clusterRoleBinding.yaml
2326
- manifests/blackboxExporter-configuration.yaml
2427
- manifests/blackboxExporter-deployment.yaml
28+
- manifests/blackboxExporter-networkPolicy.yaml
2529
- manifests/blackboxExporter-service.yaml
2630
- manifests/blackboxExporter-serviceAccount.yaml
2731
- manifests/blackboxExporter-serviceMonitor.yaml
@@ -30,13 +34,16 @@ resources:
3034
- manifests/grafana-dashboardDefinitions.yaml
3135
- manifests/grafana-dashboardSources.yaml
3236
- manifests/grafana-deployment.yaml
37+
- manifests/grafana-networkPolicy.yaml
38+
- manifests/grafana-prometheusRule.yaml
3339
- manifests/grafana-service.yaml
3440
- manifests/grafana-serviceAccount.yaml
3541
- manifests/grafana-serviceMonitor.yaml
3642
- manifests/kubePrometheus-prometheusRule.yaml
3743
- manifests/kubeStateMetrics-clusterRole.yaml
3844
- manifests/kubeStateMetrics-clusterRoleBinding.yaml
3945
- manifests/kubeStateMetrics-deployment.yaml
46+
- manifests/kubeStateMetrics-networkPolicy.yaml
4047
- manifests/kubeStateMetrics-prometheusRule.yaml
4148
- manifests/kubeStateMetrics-service.yaml
4249
- manifests/kubeStateMetrics-serviceAccount.yaml
@@ -50,12 +57,14 @@ resources:
5057
- manifests/nodeExporter-clusterRole.yaml
5158
- manifests/nodeExporter-clusterRoleBinding.yaml
5259
- manifests/nodeExporter-daemonset.yaml
60+
- manifests/nodeExporter-networkPolicy.yaml
5361
- manifests/nodeExporter-prometheusRule.yaml
5462
- manifests/nodeExporter-service.yaml
5563
- manifests/nodeExporter-serviceAccount.yaml
5664
- manifests/nodeExporter-serviceMonitor.yaml
5765
- manifests/prometheus-clusterRole.yaml
5866
- manifests/prometheus-clusterRoleBinding.yaml
67+
- manifests/prometheus-networkPolicy.yaml
5968
- manifests/prometheus-podDisruptionBudget.yaml
6069
- manifests/prometheus-prometheus.yaml
6170
- manifests/prometheus-prometheusRule.yaml
@@ -74,6 +83,7 @@ resources:
7483
- manifests/prometheusAdapter-clusterRoleServerResources.yaml
7584
- manifests/prometheusAdapter-configMap.yaml
7685
- manifests/prometheusAdapter-deployment.yaml
86+
- manifests/prometheusAdapter-networkPolicy.yaml
7787
- manifests/prometheusAdapter-podDisruptionBudget.yaml
7888
- manifests/prometheusAdapter-roleBindingAuthReader.yaml
7989
- manifests/prometheusAdapter-service.yaml
@@ -82,6 +92,7 @@ resources:
8292
- manifests/prometheusOperator-clusterRole.yaml
8393
- manifests/prometheusOperator-clusterRoleBinding.yaml
8494
- manifests/prometheusOperator-deployment.yaml
95+
- manifests/prometheusOperator-networkPolicy.yaml
8596
- manifests/prometheusOperator-prometheusRule.yaml
8697
- manifests/prometheusOperator-service.yaml
8798
- manifests/prometheusOperator-serviceAccount.yaml

bases/monitoring/manifests/alertmanager-alertmanager.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -6,11 +6,11 @@ metadata:
66
app.kubernetes.io/instance: main
77
app.kubernetes.io/name: alertmanager
88
app.kubernetes.io/part-of: kube-prometheus
9-
app.kubernetes.io/version: 0.23.0
9+
app.kubernetes.io/version: 0.26.0
1010
name: main
1111
namespace: monitoring
1212
spec:
13-
image: quay.io/prometheus/alertmanager:v0.23.0
13+
image: quay.io/prometheus/alertmanager:v0.26.0
1414
nodeSelector:
1515
kubernetes.io/os: linux
1616
podMetadata:
@@ -19,7 +19,7 @@ spec:
1919
app.kubernetes.io/instance: main
2020
app.kubernetes.io/name: alertmanager
2121
app.kubernetes.io/part-of: kube-prometheus
22-
app.kubernetes.io/version: 0.23.0
22+
app.kubernetes.io/version: 0.26.0
2323
replicas: 3
2424
resources:
2525
limits:
@@ -33,4 +33,4 @@ spec:
3333
runAsNonRoot: true
3434
runAsUser: 1000
3535
serviceAccountName: alertmanager-main
36-
version: 0.23.0
36+
version: 0.26.0

bases/monitoring/manifests/alertmanager-networkPolicy.yaml

Lines changed: 42 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,42 @@
1+
apiVersion: networking.k8s.io/v1
2+
kind: NetworkPolicy
3+
metadata:
4+
labels:
5+
app.kubernetes.io/component: alert-router
6+
app.kubernetes.io/instance: main
7+
app.kubernetes.io/name: alertmanager
8+
app.kubernetes.io/part-of: kube-prometheus
9+
app.kubernetes.io/version: 0.26.0
10+
name: alertmanager-main
11+
namespace: monitoring
12+
spec:
13+
egress:
14+
- {}
15+
ingress:
16+
- from:
17+
- podSelector:
18+
matchLabels:
19+
app.kubernetes.io/name: prometheus
20+
ports:
21+
- port: 9093
22+
protocol: TCP
23+
- port: 8080
24+
protocol: TCP
25+
- from:
26+
- podSelector:
27+
matchLabels:
28+
app.kubernetes.io/name: alertmanager
29+
ports:
30+
- port: 9094
31+
protocol: TCP
32+
- port: 9094
33+
protocol: UDP
34+
podSelector:
35+
matchLabels:
36+
app.kubernetes.io/component: alert-router
37+
app.kubernetes.io/instance: main
38+
app.kubernetes.io/name: alertmanager
39+
app.kubernetes.io/part-of: kube-prometheus
40+
policyTypes:
41+
- Egress
42+
- Ingress

bases/monitoring/manifests/alertmanager-podDisruptionBudget.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ metadata:
66
app.kubernetes.io/instance: main
77
app.kubernetes.io/name: alertmanager
88
app.kubernetes.io/part-of: kube-prometheus
9-
app.kubernetes.io/version: 0.23.0
9+
app.kubernetes.io/version: 0.26.0
1010
name: alertmanager-main
1111
namespace: monitoring
1212
spec:

bases/monitoring/manifests/alertmanager-prometheusRule.yaml

Lines changed: 14 additions & 32 deletions
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ metadata:
66
app.kubernetes.io/instance: main
77
app.kubernetes.io/name: alertmanager
88
app.kubernetes.io/part-of: kube-prometheus
9-
app.kubernetes.io/version: 0.23.0
9+
app.kubernetes.io/version: 0.26.0
1010
prometheus: k8s
1111
role: alert-rules
1212
name: alertmanager-main-rules
@@ -17,8 +17,7 @@ spec:
1717
rules:
1818
- alert: AlertmanagerFailedReload
1919
annotations:
20-
description: Configuration has failed to load for {{ $labels.namespace }}/{{
21-
$labels.pod}}.
20+
description: Configuration has failed to load for {{ $labels.namespace }}/{{ $labels.pod}}.
2221
runbook_url: https://runbooks.prometheus-operator.dev/runbooks/alertmanager/alertmanagerfailedreload
2322
summary: Reloading an Alertmanager configuration has failed.
2423
expr: |
@@ -30,11 +29,9 @@ spec:
3029
severity: critical
3130
- alert: AlertmanagerMembersInconsistent
3231
annotations:
33-
description: Alertmanager {{ $labels.namespace }}/{{ $labels.pod}} has only
34-
found {{ $value }} members of the {{$labels.job}} cluster.
32+
description: Alertmanager {{ $labels.namespace }}/{{ $labels.pod}} has only found {{ $value }} members of the {{$labels.job}} cluster.
3533
runbook_url: https://runbooks.prometheus-operator.dev/runbooks/alertmanager/alertmanagermembersinconsistent
36-
summary: A member of an Alertmanager cluster has not found all other cluster
37-
members.
34+
summary: A member of an Alertmanager cluster has not found all other cluster members.
3835
expr: |
3936
# Without max_over_time, failed scrapes could create false negatives, see
4037
# https://www.robustperception.io/alerting-on-gauges-in-prometheus-2-0 for details.
@@ -46,9 +43,7 @@ spec:
4643
severity: critical
4744
- alert: AlertmanagerFailedToSendAlerts
4845
annotations:
49-
description: Alertmanager {{ $labels.namespace }}/{{ $labels.pod}} failed
50-
to send {{ $value | humanizePercentage }} of notifications to {{ $labels.integration
51-
}}.
46+
description: Alertmanager {{ $labels.namespace }}/{{ $labels.pod}} failed to send {{ $value | humanizePercentage }} of notifications to {{ $labels.integration }}.
5247
runbook_url: https://runbooks.prometheus-operator.dev/runbooks/alertmanager/alertmanagerfailedtosendalerts
5348
summary: An Alertmanager instance failed to send notifications.
5449
expr: |
@@ -63,12 +58,9 @@ spec:
6358
severity: warning
6459
- alert: AlertmanagerClusterFailedToSendAlerts
6560
annotations:
66-
description: The minimum notification failure rate to {{ $labels.integration
67-
}} sent from any instance in the {{$labels.job}} cluster is {{ $value |
68-
humanizePercentage }}.
61+
description: The minimum notification failure rate to {{ $labels.integration }} sent from any instance in the {{$labels.job}} cluster is {{ $value | humanizePercentage }}.
6962
runbook_url: https://runbooks.prometheus-operator.dev/runbooks/alertmanager/alertmanagerclusterfailedtosendalerts
70-
summary: All Alertmanager instances in a cluster failed to send notifications
71-
to a critical integration.
63+
summary: All Alertmanager instances in a cluster failed to send notifications to a critical integration.
7264
expr: |
7365
min by (namespace,service, integration) (
7466
rate(alertmanager_notifications_failed_total{job="alertmanager-main",namespace="monitoring", integration=~`.*`}[5m])
@@ -81,12 +73,9 @@ spec:
8173
severity: critical
8274
- alert: AlertmanagerClusterFailedToSendAlerts
8375
annotations:
84-
description: The minimum notification failure rate to {{ $labels.integration
85-
}} sent from any instance in the {{$labels.job}} cluster is {{ $value |
86-
humanizePercentage }}.
76+
description: The minimum notification failure rate to {{ $labels.integration }} sent from any instance in the {{$labels.job}} cluster is {{ $value | humanizePercentage }}.
8777
runbook_url: https://runbooks.prometheus-operator.dev/runbooks/alertmanager/alertmanagerclusterfailedtosendalerts
88-
summary: All Alertmanager instances in a cluster failed to send notifications
89-
to a non-critical integration.
78+
summary: All Alertmanager instances in a cluster failed to send notifications to a non-critical integration.
9079
expr: |
9180
min by (namespace,service, integration) (
9281
rate(alertmanager_notifications_failed_total{job="alertmanager-main",namespace="monitoring", integration!~`.*`}[5m])
@@ -99,8 +88,7 @@ spec:
9988
severity: warning
10089
- alert: AlertmanagerConfigInconsistent
10190
annotations:
102-
description: Alertmanager instances within the {{$labels.job}} cluster have
103-
different configurations.
91+
description: Alertmanager instances within the {{$labels.job}} cluster have different configurations.
10492
runbook_url: https://runbooks.prometheus-operator.dev/runbooks/alertmanager/alertmanagerconfiginconsistent
10593
summary: Alertmanager instances within the same cluster have different configurations.
10694
expr: |
@@ -113,12 +101,9 @@ spec:
113101
severity: critical
114102
- alert: AlertmanagerClusterDown
115103
annotations:
116-
description: '{{ $value | humanizePercentage }} of Alertmanager instances
117-
within the {{$labels.job}} cluster have been up for less than half of the
118-
last 5m.'
104+
description: '{{ $value | humanizePercentage }} of Alertmanager instances within the {{$labels.job}} cluster have been up for less than half of the last 5m.'
119105
runbook_url: https://runbooks.prometheus-operator.dev/runbooks/alertmanager/alertmanagerclusterdown
120-
summary: Half or more of the Alertmanager instances within the same cluster
121-
are down.
106+
summary: Half or more of the Alertmanager instances within the same cluster are down.
122107
expr: |
123108
(
124109
count by (namespace,service) (
@@ -135,12 +120,9 @@ spec:
135120
severity: critical
136121
- alert: AlertmanagerClusterCrashlooping
137122
annotations:
138-
description: '{{ $value | humanizePercentage }} of Alertmanager instances
139-
within the {{$labels.job}} cluster have restarted at least 5 times in the
140-
last 10m.'
123+
description: '{{ $value | humanizePercentage }} of Alertmanager instances within the {{$labels.job}} cluster have restarted at least 5 times in the last 10m.'
141124
runbook_url: https://runbooks.prometheus-operator.dev/runbooks/alertmanager/alertmanagerclustercrashlooping
142-
summary: Half or more of the Alertmanager instances within the same cluster
143-
are crashlooping.
125+
summary: Half or more of the Alertmanager instances within the same cluster are crashlooping.
144126
expr: |
145127
(
146128
count by (namespace,service) (

bases/monitoring/manifests/alertmanager-secret.yaml

Lines changed: 11 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ metadata:
66
app.kubernetes.io/instance: main
77
app.kubernetes.io/name: alertmanager
88
app.kubernetes.io/part-of: kube-prometheus
9-
app.kubernetes.io/version: 0.23.0
9+
app.kubernetes.io/version: 0.26.0
1010
name: alertmanager-main
1111
namespace: monitoring
1212
stringData:
@@ -28,10 +28,17 @@ stringData:
2828
- "severity = warning"
2929
"target_matchers":
3030
- "severity = info"
31+
- "equal":
32+
- "namespace"
33+
"source_matchers":
34+
- "alertname = InfoInhibitor"
35+
"target_matchers":
36+
- "severity = info"
3137
"receivers":
3238
- "name": "Default"
3339
- "name": "Watchdog"
3440
- "name": "Critical"
41+
- "name": "null"
3542
"route":
3643
"group_by":
3744
- "namespace"
@@ -43,6 +50,9 @@ stringData:
4350
- "matchers":
4451
- "alertname = Watchdog"
4552
"receiver": "Watchdog"
53+
- "matchers":
54+
- "alertname = InfoInhibitor"
55+
"receiver": "null"
4656
- "matchers":
4757
- "severity = critical"
4858
"receiver": "Critical"

bases/monitoring/manifests/alertmanager-service.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ metadata:
66
app.kubernetes.io/instance: main
77
app.kubernetes.io/name: alertmanager
88
app.kubernetes.io/part-of: kube-prometheus
9-
app.kubernetes.io/version: 0.23.0
9+
app.kubernetes.io/version: 0.26.0
1010
name: alertmanager-main
1111
namespace: monitoring
1212
spec:

bases/monitoring/manifests/alertmanager-serviceAccount.yaml

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,12 @@
11
apiVersion: v1
2+
automountServiceAccountToken: false
23
kind: ServiceAccount
34
metadata:
45
labels:
56
app.kubernetes.io/component: alert-router
67
app.kubernetes.io/instance: main
78
app.kubernetes.io/name: alertmanager
89
app.kubernetes.io/part-of: kube-prometheus
9-
app.kubernetes.io/version: 0.23.0
10+
app.kubernetes.io/version: 0.26.0
1011
name: alertmanager-main
1112
namespace: monitoring

bases/monitoring/manifests/alertmanager-serviceMonitor.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ metadata:
66
app.kubernetes.io/instance: main
77
app.kubernetes.io/name: alertmanager
88
app.kubernetes.io/part-of: kube-prometheus
9-
app.kubernetes.io/version: 0.23.0
9+
app.kubernetes.io/version: 0.26.0
1010
name: alertmanager-main
1111
namespace: monitoring
1212
spec:

bases/monitoring/manifests/blackboxExporter-clusterRoleBinding.yaml

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -5,9 +5,8 @@ metadata:
55
app.kubernetes.io/component: exporter
66
app.kubernetes.io/name: blackbox-exporter
77
app.kubernetes.io/part-of: kube-prometheus
8-
app.kubernetes.io/version: 0.19.0
8+
app.kubernetes.io/version: 0.24.0
99
name: blackbox-exporter
10-
namespace: monitoring
1110
roleRef:
1211
apiGroup: rbac.authorization.k8s.io
1312
kind: ClusterRole

0 commit comments

Comments
 (0)