Skip to content

Commit

Permalink
remove alert HighlyAvailableWorkloadIncorrectlySpread
Browse files (browse the repository at this point in the history)
  • Loading branch information
raptorsun committed Nov 22, 2021
1 parent 9070ffb commit 20db568
Show file tree
Hide file tree
Showing 5 changed files with 0 additions and 267 deletions.
33 changes: 0 additions & 33 deletions assets/cluster-monitoring-operator/prometheus-rule.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -28,39 +28,6 @@ spec:
for: 15m
labels:
severity: warning
# Alert HighlyAvailableWorkloadIncorrectlySpread: severity "warning", must hold
# for 1h before firing.
#
# How the expression is assembled, innermost part first:
#   1. `count without(pod) (...) > 1` takes the
#      namespace_workload_pod:kube_pod_owner:relabel series whose namespace
#      matches openshift-.*, kube-.* or default, and keeps the groups that
#      still contain more than one series once the `pod` label is dropped
#      (presumably: workloads owning more than one pod - confirm against the
#      recording rule).
#   2. That result is joined back onto the unfiltered relabel series on
#      (namespace, workload, workload_type).
#   3. `max by(namespace, pod, workload)` of
#      kube_pod_spec_volumes_persistentvolumeclaims_info is joined with step 2
#      on (namespace, pod); group_left(workload) copies the `workload` label
#      into the result, so only pods present in both sides remain.
#   4. kube_pod_info{node!=""} is joined with step 3 on (namespace, pod), again
#      carrying `workload` over, which attaches a non-empty `node` label.
#   5. `group by (node, workload, namespace)` collapses the result to one series
#      per distinct label combination, and `count without (node)` counts those
#      series per (workload, namespace).
# The rule matches when that count `== 1`.
# NOTE(review): a count of 1 means every matched pod of the workload reports the
# same node, while the annotations below say "spread across multiple nodes" -
# confirm the wording is intended.
- alert: HighlyAvailableWorkloadIncorrectlySpread
annotations:
description: Workload {{ $labels.namespace }}/{{ $labels.workload }} is incorrectly
spread across multiple nodes which breaks high-availability requirements.
Since the workload is using persistent volumes, manual intervention is needed.
Please follow the guidelines provided in the runbook of this alert to fix
this issue.
runbook_url: https://github.com/openshift/runbooks/blob/master/alerts/HighlyAvailableWorkloadIncorrectlySpread.md
summary: Highly-available workload is incorrectly spread across multiple nodes
and manual intervention is needed.
expr: |
count without (node)
(
group by (node, workload, namespace)
(
kube_pod_info{node!=""}
* on(namespace,pod) group_left(workload)
(
max by(namespace, pod, workload) (kube_pod_spec_volumes_persistentvolumeclaims_info)
* on(namespace,pod) group_left(workload)
(
namespace_workload_pod:kube_pod_owner:relabel
* on(namespace,workload,workload_type) group_left()
(
count without(pod) (namespace_workload_pod:kube_pod_owner:relabel{namespace=~"(openshift-.*|kube-.*|default)"}) > 1
)
)
)
)
) == 1
for: 1h
labels:
severity: warning
- name: openshift-kubernetes.rules
rules:
- expr: sum(rate(container_cpu_usage_seconds_total{container="",pod!=""}[5m]))
Expand Down
33 changes: 0 additions & 33 deletions jsonnet/rules.libsonnet
Original file line number Diff line number Diff line change
Expand Up @@ -22,39 +22,6 @@ function(params) {
severity: 'warning',
},
},
// Alert rule object for HighlyAvailableWorkloadIncorrectlySpread
// (severity 'warning', 'for' 1h).
//
// `expr` is a ||| text block formatted with `% cfg`, so the
// %(namespaceSelector)s placeholder is filled from cfg.namespaceSelector
// (the value of that field is not visible in this excerpt).
//
// Expression outline, innermost part first:
//   1. `count without(pod) (...) > 1` keeps the groups of
//      namespace_workload_pod:kube_pod_owner:relabel series (restricted by the
//      namespace selector) that still hold more than one series once the `pod`
//      label is dropped.
//   2. The result is joined back onto the relabel series on
//      (namespace, workload, workload_type).
//   3. That is joined on (namespace, pod) with the max of
//      kube_pod_spec_volumes_persistentvolumeclaims_info, then with
//      kube_pod_info{node!=""}; group_left(workload) carries the `workload`
//      label through both joins.
//   4. `group by (node, workload, namespace)` followed by
//      `count without (node)` counts the distinct `node` values per
//      (workload, namespace).
// The rule matches when that count `== 1`.
// NOTE(review): a count of 1 means all matched pods report the same node, while
// the description says "spread across multiple nodes" - confirm the wording.
{
expr: |||
count without (node)
(
group by (node, workload, namespace)
(
kube_pod_info{node!=""}
* on(namespace,pod) group_left(workload)
(
max by(namespace, pod, workload) (kube_pod_spec_volumes_persistentvolumeclaims_info)
* on(namespace,pod) group_left(workload)
(
namespace_workload_pod:kube_pod_owner:relabel
* on(namespace,workload,workload_type) group_left()
(
count without(pod) (namespace_workload_pod:kube_pod_owner:relabel{%(namespaceSelector)s}) > 1
)
)
)
)
) == 1
||| % cfg,
alert: 'HighlyAvailableWorkloadIncorrectlySpread',
'for': '1h',
annotations: {
description: 'Workload {{ $labels.namespace }}/{{ $labels.workload }} is incorrectly spread across multiple nodes which breaks high-availability requirements. Since the workload is using persistent volumes, manual intervention is needed. Please follow the guidelines provided in the runbook of this alert to fix this issue.',
summary: 'Highly-available workload is incorrectly spread across multiple nodes and manual intervention is needed.',
runbook_url: 'https://github.com/openshift/runbooks/blob/master/alerts/HighlyAvailableWorkloadIncorrectlySpread.md',
},
labels: {
severity: 'warning',
},
},
],
},
{
Expand Down
1 change: 0 additions & 1 deletion jsonnet/utils/sanitize-rules.libsonnet
Original file line number Diff line number Diff line change
Expand Up @@ -336,7 +336,6 @@ local includeRunbooks = {
AlertmanagerFailedReload: openShiftRunbookCMO('AlertmanagerFailedReload.md'),
ClusterOperatorDegraded: openShiftRunbookCMO('ClusterOperatorDegraded.md'),
ClusterOperatorDown: openShiftRunbookCMO('ClusterOperatorDown.md'),
HighlyAvailableWorkloadIncorrectlySpread: openShiftRunbook('alerts/HighlyAvailableWorkloadIncorrectlySpread.md'),
KubeAPIDown: openShiftRunbookCMO('KubeAPIDown.md'),
KubeDeploymentReplicasMismatch: openShiftRunbookCMO('KubeDeploymentReplicasMismatch.md'),
KubeJobFailed: openShiftRunbookCMO('KubeJobFailed.md'),
Expand Down
61 changes: 0 additions & 61 deletions test/rules/bz2006561.yaml

This file was deleted.

139 changes: 0 additions & 139 deletions test/rules/workload_incorrectly_spread.yaml

This file was deleted.

0 comments on commit 20db568

Please sign in to comment.