blob: 7c446cd85eac67d926edcc0a4404dfb7162206db (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
|
---
# Monitoring template "Template OS Linux": the items it collects and the
# triggers evaluated over those items.
#
# NOTE(review): the {HOST.NAME} macro and the '{<template>:<key>.last()}'
# expressions look like Zabbix trigger syntax, and the item keys look like
# PCP metric names. The schema (zitems / ztriggers, value_type, priority) is
# defined by whatever consumes this variable, which is not visible here;
# confirm before adding or renaming fields.
g_template_os_linux:
  # Must match the template name used inside every trigger expression below.
  name: Template OS Linux

  # One entry per collected metric: its key, the application group it is
  # filed under (Kernel, Memory or Disk) and its value type (string, int or
  # float). Entry order is kept exactly as in the original file.
  zitems:
    - key: kernel.uname.sysname
      applications:
        - Kernel
      value_type: string
    - key: kernel.all.cpu.wait.total
      applications:
        - Kernel
      value_type: int
    - key: kernel.all.cpu.irq.hard
      applications:
        - Kernel
      value_type: int
    - key: kernel.all.cpu.idle
      applications:
        - Kernel
      value_type: int
    - key: kernel.uname.distro
      applications:
        - Kernel
      value_type: string
    - key: kernel.uname.nodename
      applications:
        - Kernel
      value_type: string
    - key: kernel.all.cpu.irq.soft
      applications:
        - Kernel
      value_type: int
    - key: kernel.all.load.15_minute
      applications:
        - Kernel
      value_type: float
    - key: kernel.all.cpu.sys
      applications:
        - Kernel
      value_type: int
    - key: kernel.all.load.5_minute
      applications:
        - Kernel
      value_type: float
    # Referenced by the "Lack of available memory" trigger.
    - key: mem.freemem
      applications:
        - Memory
      value_type: int
    - key: kernel.all.cpu.nice
      applications:
        - Kernel
      value_type: int
    - key: mem.util.bufmem
      applications:
        - Memory
      value_type: int
    - key: swap.used
      applications:
        - Memory
      value_type: int
    - key: kernel.all.load.1_minute
      applications:
        - Kernel
      value_type: float
    - key: kernel.uname.version
      applications:
        - Kernel
      value_type: string
    - key: swap.length
      applications:
        - Memory
      value_type: int
    - key: mem.physmem
      applications:
        - Memory
      value_type: int
    - key: kernel.all.uptime
      applications:
        - Kernel
      value_type: int
    - key: swap.free
      applications:
        - Memory
      value_type: int
    - key: mem.util.available
      applications:
        - Memory
      value_type: int
    - key: mem.util.used
      applications:
        - Memory
      value_type: int
    - key: kernel.all.cpu.user
      applications:
        - Kernel
      value_type: int
    - key: kernel.uname.machine
      applications:
        - Kernel
      value_type: string
    - key: hinv.ncpu
      applications:
        - Kernel
      value_type: int
    - key: mem.util.cached
      applications:
        - Memory
      value_type: int
    - key: kernel.all.cpu.steal
      applications:
        - Kernel
      value_type: int
    - key: kernel.all.pswitch
      applications:
        - Kernel
      value_type: int
    - key: kernel.uname.release
      applications:
        - Kernel
      value_type: string
    # Referenced by the "Too many TOTAL processes" trigger.
    - key: proc.nprocs
      applications:
        - Kernel
      value_type: int
    # The two filesys.full.* items feed the filesystem triggers; the trigger
    # descriptions pair xvda2 with "/" and xvda3 with "/var".
    # NOTE(review): the device names are hard-coded — confirm they match the
    # monitored hosts.
    - key: filesys.full.xvda2
      applications:
        - Disk
      value_type: float
    - key: filesys.full.xvda3
      applications:
        - Disk
      value_type: float

  # Each trigger compares the last value of one item from zitems against a
  # fixed threshold and links to its SOP page.
  ztriggers:
    # Filesystem triggers come in pairs on the same item: warn above 90 and
    # high above 95, so both conditions hold once the value exceeds 95.
    # The descriptions equate ">90" with "less than 10% free", i.e. the item
    # is treated as a percent-full figure.
    - description: 'Filesystem: / has less than 10% free on {HOST.NAME}'
      expression: '{Template OS Linux:filesys.full.xvda2.last()}>90'
      url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_filesys_full.asciidoc'
      priority: warn
    - description: 'Filesystem: / has less than 5% free on {HOST.NAME}'
      expression: '{Template OS Linux:filesys.full.xvda2.last()}>95'
      url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_filesys_full.asciidoc'
      priority: high
    - description: 'Filesystem: /var has less than 10% free on {HOST.NAME}'
      expression: '{Template OS Linux:filesys.full.xvda3.last()}>90'
      url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_filesys_full.asciidoc'
      priority: warn
    - description: 'Filesystem: /var has less than 5% free on {HOST.NAME}'
      expression: '{Template OS Linux:filesys.full.xvda3.last()}>95'
      url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_filesys_full.asciidoc'
      priority: high
    - description: 'Too many TOTAL processes on {HOST.NAME}'
      expression: '{Template OS Linux:proc.nprocs.last()}>5000'
      url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_proc.asciidoc'
      priority: warn
    # NOTE(review): the unit of the 3000 threshold is not shown in this file;
    # confirm it against the unit mem.freemem is reported in.
    - description: 'Lack of available memory on {HOST.NAME}'
      expression: '{Template OS Linux:mem.freemem.last()}<3000'
      url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_memory.asciidoc'
      priority: warn
|