5
5
- alert: HighCPUUsage
6
6
expr: |
7
7
100 - (avg by (instance) (irate(node_cpu_seconds_total{mode="idle"}[1m])) * 100) > {{ cpu_usage_threshold | default(80) }}
8
- for: 10s # this need to be changed for production alerts, its 10s for test purposes only
8
+ for: 30s # this needs to be changed for production alerts; it's 30s for test purposes only
9
9
labels:
10
10
severity: warning
11
11
annotations:
@@ -16,7 +16,7 @@ groups:
16
16
- alert: HighMemoryUsage
17
17
expr: |
18
18
(1 - (node_memory_MemAvailable_bytes / node_memory_MemTotal_bytes)) * 100 > {{ memory_usage_threshold | default(80) }}
19
- for: 10s # this need to be changed for production alerts, its 10s for test purposes only
19
+ for: 30s # this needs to be changed for production alerts; it's 30s for test purposes only
20
20
labels:
21
21
severity: warning
22
22
annotations:
@@ -27,7 +27,7 @@ groups:
27
27
- alert: DiskSpaceLow
28
28
expr: |
29
29
(node_filesystem_avail_bytes / node_filesystem_size_bytes) * 100 < {{ disk_space_threshold | default(20) }}
30
- for: 10s # this need to be changed for production alerts, its 10s for test purposes only
30
+ for: 30s # this needs to be changed for production alerts; it's 30s for test purposes only
31
31
labels:
32
32
severity: warning
33
33
annotations:
@@ -38,7 +38,7 @@ groups:
38
38
- alert: HighDiskIOUsage
39
39
expr: |
40
40
(irate(node_disk_io_time_seconds_total[1m]) * 100) > {{ disk_io_threshold | default(40) }}
41
- for: 10s # this need to be changed for production alerts, its 10s for test purposes only
41
+ for: 30s # this needs to be changed for production alerts; it's 30s for test purposes only
42
42
labels:
43
43
severity: critical
44
44
annotations:
@@ -59,7 +59,7 @@ groups:
59
59
- alert: DiskInodesLow
60
60
expr: |
61
61
(node_filesystem_files_free / node_filesystem_files) * 100 < {{ inode_threshold | default(10) }}
62
- for: 10s # this need to be changed for production alerts, its 10s for test purposes only
62
+ for: 30s # this needs to be changed for production alerts; it's 30s for test purposes only
63
63
labels:
64
64
severity: warning
65
65
annotations:
@@ -71,7 +71,7 @@ groups:
71
71
- alert: NodeExporterDown
72
72
expr: |
73
73
up{job="node_exporter"} == 0
74
- for: 10s # this need to be changed for production alerts, its 10s for test purposes only
74
+ for: 30s # this needs to be changed for production alerts; it's 30s for test purposes only
75
75
labels:
76
76
severity: critical
77
77
annotations:
@@ -82,7 +82,7 @@ groups:
82
82
- alert: GrafanaDown
83
83
expr: |
84
84
up{instance="grafana"} == 0
85
- for: 10s # this need to be changed for production alerts, its 10s for test purposes only
85
+ for: 30s # this needs to be changed for production alerts; it's 30s for test purposes only
86
86
labels:
87
87
severity: critical
88
88
annotations:
0 commit comments