diff --git a/conf/prometheus/alerts/node.yml b/conf/prometheus/alerts/node.yml index 1fe550a..0f02673 100644 --- a/conf/prometheus/alerts/node.yml +++ b/conf/prometheus/alerts/node.yml @@ -137,13 +137,13 @@ groups: # Alert threshold depends on nature of application. # Please read: https://github.com/samber/awesome-prometheus-alerts/issues/58 - alert: HostContextSwitching - expr: (rate(node_context_switches_total[5m])) / (count without(cpu, mode) (node_cpu_seconds_total{mode="idle"})) > 2000 + expr: (rate(node_context_switches_total[5m])) / (count without(cpu, mode) (node_cpu_seconds_total{mode="idle"})) > 4000 for: 0m labels: severity: warning annotations: summary: Host context switching (instance {{ $labels.instance }}) - description: "Context switching is growing on node (> 2000 / s)\n VALUE = {{ $value }}\n LABELS = {{ $labels }}" + description: "Context switching is growing on node (> 4000 / s)\n VALUE = {{ $value }}\n LABELS = {{ $labels }}" - alert: HostSwapIsFillingUp expr: (1 - (node_memory_SwapFree_bytes / node_memory_SwapTotal_bytes)) * 100 > 80