Skip to content

Commit

Permalink
fix: inhibit_rules in monitoring
Browse files: browse the repository at this point in the history
  • Loading branch information
grifonas committed Aug 20, 2024
1 parent 42964bf commit fa38a40
Showing 1 changed file with 5 additions and 10 deletions.
15 changes: 5 additions & 10 deletions monitoring/assets/helm-values-monitoring.tpl
Original file line number | Diff line number | Diff line change
Expand Up @@ -38,6 +38,8 @@ defaultRules:
KubeMemoryOvercommit: true
KubeCPUOvercommit: true
AlertmanagerFailedToSendAlerts: true
CPUThrottlingHigh: true
KubeletTooManyPods: true

alertmanager:
ingress:
Expand Down Expand Up @@ -69,19 +71,12 @@ alertmanager:
- alertname
source_matchers:
- severity = warning
target_matchers:
- target_matchers:
- severity = info
- equal:
- namespace
source_matchers:
- alertname = InfoInhibitor
target_matchers:
- severity = info
- target_matchers:
- alertname = InfoInhibitor
# https://runbooks.prometheus-operator.dev/runbooks/kubernetes/cputhrottlinghigh/
- target_matchers:
- alertname = CPUThrottlingHigh
- target_matchers:
- alertname = AlertmanagerFailedToSendAlerts

Expand Down Expand Up @@ -581,9 +576,9 @@ additionalPrometheusRulesMap:
severity: warning
- alert: NginxLatency
annotations:
message: Ingress {{ $labels.host }} 95th req. latency percentile {{ $value }}.
message: Ingress {{ $labels.host }} 99th req. latency percentile {{ $value }}.
runbook_url: https://github.com/contiamo/ops-docs/tree/master/runbook/NginxIngressMetrics.md#nginxerrors
expr: histogram_quantile(0.95, sum(rate(nginx_ingress_controller_request_duration_seconds_bucket{ingress!=""}[5m])) by (le, ingress, host, exported_namespace)) > 2
expr: histogram_quantile(0.99, sum(rate(nginx_ingress_controller_request_duration_seconds_bucket{ingress!=""}[5m])) by (le, ingress, host, exported_namespace)) > 10
for: 10m
labels:
severity: warning

0 comments on commit fa38a40

Please sign in to comment.