-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathpm_logconv_rules.conf
298 lines (254 loc) · 7.24 KB
/
pm_logconv_rules.conf
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
#
# pm_logconv_rules.conf : Config file of pm_logconv for Pacemaker and Corosync
#
###
# For Resource event.
###
#MsgNo.1-1, 2-1, 4-1, 5-1, 11-1, 12-1, 17-1, 18-1
[Resource tries to operation]
pattern=crmd,info:,Performing,key=,op=,!_monitor_,!_notify_0
func=try_to_operate
#MsgNo.1-2, 2-2, 4-2, 5-2, 11-2, 12-2, 17-2, 18-2
[Resource operation succeeded]
pattern=crmd,notice:,Result of,operation for,: 0,!(probe|monitor|notify) operation
func=operation_succeeded
loglevel=info
#MsgNo.1-3, 2-3, 3-1, 4-3, 5-3, 11-3, 12-3, 17-3, 19-1
[Resource operation failed]
pattern_info=crmd,info:,Result of,operation for,!: [078],!(probe|notify) operation,!: (Timed Out|Cancelled)
pattern_notice=crmd,notice:,Result of,operation for,!: [078],!(probe|notify) operation
pattern_error=crmd,error:,Result of,operation for,!(probe|notify) operation,!: Timed Out
func=operation_failed
loglevel=error
#MsgNo.1-4, 2-4, 3-3, 4-4, 5-4, 11-4, 12-4, 17-4, 19-3
[OCF resource operation timedout]
pattern=crmd,error:,Result of,operation for,!probe operation,!notify operation,: Timed Out
func=operation_timedout_ocf
#MsgNo.3-2
[Detect resource does not running]
pattern=crmd,info:,Result of monitor operation for,: 7,not running
func=detect_rsc_failure
loglevel=error
###
# For Node status event.
##
#MsgNo.6-1, 6-2
[Node status updated]
pattern_lost=crmd,info:,is now lost
pattern_member=crmd,info:,is now member,!expected state
func=node_status_updated
#MsgNo.6-3
[Node status determined]
pattern=pengine,Node,is
func=node_status_determined
###
# For Interconnect-LAN status event
# and Network status event (detected by ping).
###
#MsgNo.7-1
[Interconnect-LAN status dead]
pattern=corosync,,Marking seqid,ringid,interface,FAULTY
func=detect_iconnlan_dead
loglevel=warning
#MsgNo.7-2
[Interconnect-LAN status recover]
pattern=corosync,Automatically recovered ring
func=detect_iconnlan_recover
#MsgNo.8-1
[Network status dead]
pattern=ping,is inactive:
func=detect_node_dead
loglevel=error
###
# For Disk status event (detected by diskd).
###
#MsgNo.9-1
[Detect disk error]
pattern=diskd,warning:,disk status is changed,new_status,ERROR
func=detect_disk_error
loglevel=error
###
# For respawn process event.
###
#MsgNo.10-1
[Respawn process starts]
pattern=pacemakerd,info:,Forked child,for process
func=respawn_start
#MsgNo.10-2, 10-4, 10-5
[Respawn process exited abnormally]
pattern_notok=pacemakerd,error:,process,exited
pattern_respawnstop=pacemakerd,warning:,can no longer be respawned
pattern_errpanic=pacemakerd,emerg:,instructed the machine to reset
func=respawn_exited_abnormally
loglevel=warning
#MsgNo.10-3
[Respawn process killed]
pattern=pacemakerd,process,terminated with signal
func=respawn_killed
loglevel=warning
#MsgNo.10-6
[Respawn process exited normally]
pattern=pacemakerd,info:,process,exited
func=respawn_exited_normally
#MsgNo.10-7
[Respawning too fast in a short term]
pattern=pacemakerd,error:,Child respawn count exceeded by
func=respawn_too_fast
###
# For Fail Over. These are only for DC node.
##
#MsgNo.F0-1, F9-1, F10-1
[Detect calculation starts]
pattern=crmd,State transition,S_IDLE -> S_POLICY_ENGINE,!I_SHUTDOWN
func=detect_pe_calc
loglevel=warning
#MsgNo.F0-2, F12-1, F12-2
[FailOver complete]
pattern_idle=crmd,State transition,-> S_IDLE
pattern_stopping=crmd,State transition,-> S_STOPPING
func=detect_fo_complete
loglevel=warning
#MsgNo.F1-1, F1-2, F2-1, F2-2, F3-1, F3-2, F4-1, F4-2, F6-1, F6-2
[Action failure]
pattern=crmd,info:,Updating failcount for
func=no_output_msg
fotrigger=1
#MsgNo.F7-1, F7-2
[Node failure]
pattern=corosync,Failed to receive the leave message. failed:
func=no_output_msg
fotrigger=3
#MsgNo.F11-1
#The message is not output immediately, output when F/O is complete.
[Add Resource start action]
pattern=pengine,notice: \* Start
func=add_rsc_start
#MsgNo.F11-2
#The message is not output immediately, output when F/O is complete.
[Add Resource stop action]
pattern=pengine.*notice: \* Stop
func=add_rsc_stop
#MsgNo.F11-3, F11-5, F11-8, F11-9, F11-11, F11-12
#The message is not output immediately, output when F/O is complete.
[Add no action]
pattern_leave=pengine,info: Leave
pattern_recover=pengine,notice: \* Recover,!->
pattern_restart=pengine,notice: \* Restart
pattern_reload=pengine,notice: \* Reload
func=add_no_action
#MsgNo.F11-6, F11-13 ,F11-14
#The message is not output immediately, output when F/O is complete.
[Add Resource move action]
pattern_move=pengine,notice: \* Move
pattern_recover=pengine,notice: \* Recover,->
pattern_migrate=pengine,notice: \* Migrate
func=add_rsc_move
#MsgNo.F11-10
#The message is not output immediately, output when F/O is complete.
[Resource initiating action]
pattern=crmd,notice:,Initiating,operation,!probe_complete
func=rsc_init_action
###
# For DC election.
###
#MsgNo.13-2
[DC election is complete]
pattern=crmd,info:,Set DC to
func=dc_election_complete
#MsgNo.13-5
[Detect unset DC]
pattern=crmd,info:,Unset DC
func=detect_unset_dc
###
# For Pacemaker and Corosync service shutdown.
###
#MsgNo.14-1
[Corosync is shutting down.]
pattern=corosync,Unloading all Corosync service engines.
func=output_static_msg
#MsgNo.14-2
[Corosync shutdown complete.]
pattern=corosync,Corosync Cluster Engine exiting
func=detect_cs_shutdown
#MsgNo.14-3
[Pacemaker is shutting down.]
pattern=pacemakerd,notice:,Shutting down Pacemaker
func=output_static_msg
loglevel=info
#MsgNo.14-4
[Pacemaker shutdown complete.]
pattern=pacemakerd,notice:,Shutdown complete
func=output_static_msg
loglevel=info
#MsgNo.14-5 (only for DC)
[Corosync on the node in the cluster want to shutdown]
pattern=crmd,info:,Creating shutdown request for
func=detect_shutdown_request
###
# For fence operation.
###
#MsgNo.21-1
[fence operation start]
pattern=crmd,notice:,Requesting fencing,of node
func=fence_op_started
loglevel=info
#MsgNo.21-2
[fence operation succeeded]
pattern=crmd,notice:,was terminated,!by a human
func=fence_op_ended
loglevel=info
#MsgNo.21-3
[fence operation failed]
pattern=crmd,notice:,was not terminated
func=fence_op_ended
loglevel=error
#MsgNo.21-4
[fence too many failures]
pattern=crmd,warning:,Too many failures,to fence
func=fence_too_many_failures
loglevel=error
#MsgNo.21-5
[executing stonith device start]
pattern=stonith,info:,Requesting that, perform op
func=exec_st_device_started
#MsgNo.21-6
[executing stonith device succeeded]
pattern=stonith,notice:,Call to,on behalf of,OK
func=exec_st_device_ended
loglevel=info
#MsgNo.21-7
[executing stonith device failed]
pattern=stonith,notice:,Call to,on behalf of,!OK
func=exec_st_device_ended
loglevel=warning
#MsgNo.21-8
[Manual stonith confirm]
pattern=crmd,notice:,was terminated,by a human
func=fence_op_ended
loglevel=info
fotrigger=3
###
# For attribute event.
###
#MsgNo.22-1
[Detect attribute updated]
pattern=attrd,info:,Setting,!-> \(null\),!fail-count-,!last-failure-,!probe_complete,!shutdown
func=detect_attr_updated
loglevel=info
#MsgNo.22-2
[Detect attribute deleted]
pattern=attrd,info:,Setting,-> \(null\),!fail-count-,!last-failure-,!probe_complete,!shutdown
func=detect_attr_deleted
loglevel=info
###
# For Corosync service starts.
###
#MsgNo.23-1
[Detect Corosync is starting]
pattern=corosync,Corosync Cluster Engine,started and ready to provide service
func=detect_cs_start
#MsgNo.23-4
[Detect Pacemaker is starting]
pattern=pacemakerd,notice:,Starting Pacemaker
func=detect_pcmk_start
loglevel=info