From f354b9d96a4710189941484dc8e19e0d1136aeb8 Mon Sep 17 00:00:00 2001 From: David Hoese <david.hoese@ssec.wisc.edu> Date: Fri, 9 Oct 2020 20:05:46 -0500 Subject: [PATCH] Include updated prometheus configs --- admin/kubekorner_geosphere_prometheus_rules.yaml | 8 ++++---- admin/prometheus_kubernetes_values.yaml | 2 +- 2 files changed, 5 insertions(+), 5 deletions(-) diff --git a/admin/kubekorner_geosphere_prometheus_rules.yaml b/admin/kubekorner_geosphere_prometheus_rules.yaml index 54c1781..aa15d8c 100644 --- a/admin/kubekorner_geosphere_prometheus_rules.yaml +++ b/admin/kubekorner_geosphere_prometheus_rules.yaml @@ -211,23 +211,23 @@ spec: summary: "Host unusual network throughput out (instance {{ $labels.instance }})" description: "Host network interfaces are probably sending too much data (> 100 MB/s)\n VALUE = {{ $value }}\n LABELS: {{ $labels }}" - alert: HostUnusualDiskReadRate - expr: sum by (instance) (irate(node_disk_read_bytes_total[5m])) / 1024 / 1024 > 50 + expr: sum by (instance) (irate(node_disk_read_bytes_total[5m])) / 1024 / 1024 > 150 for: 5m labels: severity: warning ruleGroup: geosphere-node annotations: summary: "Host unusual disk read rate (instance {{ $labels.instance }})" - description: "Disk is probably reading too much data (> 50 MB/s)\n VALUE = {{ $value }}\n LABELS: {{ $labels }}" + description: "Disk is probably reading too much data (> 150 MB/s)\n VALUE = {{ $value }}\n LABELS: {{ $labels }}" - alert: HostUnusualDiskWriteRate - expr: sum by (instance) (irate(node_disk_written_bytes_total[5m])) / 1024 / 1024 > 50 + expr: sum by (instance) (irate(node_disk_written_bytes_total[5m])) / 1024 / 1024 > 150 for: 5m labels: severity: warning ruleGroup: geosphere-node annotations: summary: "Host unusual disk write rate (instance {{ $labels.instance }})" - description: "Disk is probably writing too much data (> 50 MB/s)\n VALUE = {{ $value }}\n LABELS: {{ $labels }}" + description: "Disk is probably writing too much data (> 150 MB/s)\n VALUE = {{ $value }}\n LABELS: {{ $labels }}" - alert: HostOutOfDiskSpace expr: (node_filesystem_avail_bytes{mountpoint="/"} * 100) / node_filesystem_size_bytes{mountpoint="/"} < 10 for: 5m diff --git a/admin/prometheus_kubernetes_values.yaml b/admin/prometheus_kubernetes_values.yaml index 9b338a3..5e82f25 100644 --- a/admin/prometheus_kubernetes_values.yaml +++ b/admin/prometheus_kubernetes_values.yaml @@ -43,7 +43,7 @@ alertmanager: - name: "null" - name: "geosphere-dev-team" slack_configs: - - channel: "#geo2grid" + - channel: "#geosphere" send_resolved: true color: '{{ if eq .Status "firing" }}danger{{ else }}good{{ end }}' title: '[{{ .Status | toUpper }}{{ if eq .Status "firing" }}:{{ .Alerts.Firing | len }}{{ end }}] {{ .GroupLabels.SortedPairs.Values | join " " }} {{ if gt (len .CommonLabels) (len .GroupLabels) }}({{ with .CommonLabels.Remove .GroupLabels.Names }}{{ .Values | join " " }}{{ end }}){{ end }}' -- GitLab