diff --git a/clusters/monitor/alert-rules-patch.yaml b/clusters/monitor/alert-rules-patch.yaml index 1afe66c..de754bb 100644 --- a/clusters/monitor/alert-rules-patch.yaml +++ b/clusters/monitor/alert-rules-patch.yaml @@ -17,7 +17,7 @@ metadata: data: alerting_rules.yml: | groups: - - name: Load-monitoring + - name: host-monitoring rules: - alert: HighLoad expr: node_load1 > 2.0 for: 5m @@ -26,8 +26,6 @@ data: annotations: summary: High load on {{ $labels.instance }} description: "Load is {{ $value }} (threshold: 2.0)" - - name: cpu-usage-monitoring - rules: - alert: HighCpuUsage expr: 100 - (avg by (instance) (irate(node_cpu_seconds_total{mode="idle"}[5m])) * 100) > 90 for: 5m labels: @@ -35,8 +33,6 @@ data: annotations: summary: High CPU usage on {{ $labels.instance }} description: "CPU usage is {{ $value }}%" - - name: memory-usage-monitoring - rules: - alert: HighMemoryUsage expr: (node_memory_MemTotal_bytes - node_memory_MemFree_bytes - node_memory_Buffers_bytes - node_memory_Cached_bytes) / node_memory_MemTotal_bytes * 100 > 90 for: 5m @@ -45,8 +41,6 @@ data: annotations: summary: High memory usage on {{ $labels.instance }} description: "Memory usage is {{ $value }}%" - - name: disk-usage-monitoring - rules: - alert: HighDiskUsage expr: node_filesystem_avail_bytes{fstype="ext4"} / node_filesystem_size_bytes{fstype="ext4"} * 100 < 10 for: 5m