forked from linux-ha-japan/pm_logconv-hb-1.0
-
Notifications
You must be signed in to change notification settings - Fork 0
/
pm_logconv.conf
432 lines (370 loc) · 12.3 KB
/
pm_logconv.conf
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
#
# pm_logconv.conf : Config file of pm_logconv for Pacemaker and Heartbeat
#
# support version
# Pacemaker : stable-1.0 (1.0.9 or more)
# Heartbeat : 3.0.3
#
[Settings]
#ha_log_path = /var/log/ha-log
#output_path = /var/log/pm_logconv.out
#hacf_path = /etc/ha.d/ha.cf
#hostcache_path = /var/lib/heartbeat/hostcache
#syslogformat = True
#reset_interval = 60
#attribute_pingd = not_defined default_ping_set or default_ping_set lt 100
#attribute_diskd = not_defined diskcheck_status or diskcheck_status eq ERROR
#attribute_diskd_inner = not_defined diskcheck_status_internal or diskcheck_status_internal eq ERROR
#logconv_logfacility = daemon
#act_rsc = prmExPostgreSQLDB, prmApPostgreSQLDB
###
# For Resource event.
###
#MsgNo.1-1, 2-1, 4-1, 5-1, 11-1, 12-1, 17-1, 18-1
[Resource tries to operation]
pattern_start=crmd,info:,do_lrm_rsc_op: Performing key,op,start
pattern_stop=crmd,info:,do_lrm_rsc_op: Performing key,op,stop
pattern_promote=crmd,info:,do_lrm_rsc_op:,Performing key, op,promote
pattern_demote=crmd,info:,do_lrm_rsc_op:,Performing key,op,demote
pattern_migrate_to=crmd,info:,do_lrm_rsc_op:,Performing key,op,migrate_to
pattern_migrate_from=crmd,info:,do_lrm_rsc_op:,Performing key,op,migrate_from
func=try_to_operate
#MsgNo.1-2, 2-2, 4-2, 5-2, 11-2, 12-2, 17-2, 18-2
[Resource operation succeeded]
pattern_start=crmd,info:,process_lrm_event:,LRM operation,start,rc=0,!status=,ok
pattern_stop=crmd,info:,process_lrm_event:,LRM operation,stop,rc=0,!status=,ok
pattern_promote=crmd,info:,process_lrm_event,LRM operation,promote,rc=0,!status=,ok
pattern_demote=crmd,info:,process_lrm_event,LRM operation,demote,rc=0,!status=,ok
pattern_migrate_to=crmd,info:,process_lrm_event,LRM operation,migrate_to,rc=0,!status=,ok
pattern_migrate_from=crmd,info:,process_lrm_event,LRM operation,migrate_from,rc=0,!status=,ok
func=operation_succeeded
#MsgNo.1-3, 2-3, 3-1, 4-3, 5-3, 11-3, 12-3, 17-3, 19-1
[Resource operation failed]
pattern_start=crmd,info:,process_lrm_event:,LRM operation,start,!rc=0,!status=
pattern_stop=crmd,info:,process_lrm_event:,LRM operation,stop,!rc=0,!status=
pattern_monitor=crmd,info:,process_lrm_event:,LRM operation,monitor,!monitor_0,!rc=0,!rc=8,!rc=7,!status=
pattern_promote=crmd,info:,process_lrm_event:,LRM operation,promote,!rc=0,!status=
pattern_demote=crmd,info:,process_lrm_event:,LRM operation,demote,!rc=0,!status=
pattern_migrate_to=crmd,info:,process_lrm_event:,LRM operation,migrate_to,!rc=0,!status=
pattern_migrate_from=crmd,info:,process_lrm_event:,LRM operation,migrate_from,!rc=0,!status=
func=operation_failed
loglevel=ERROR
#MsgNo.1-4, 2-4, 3-3, 4-4, 5-4, 11-4, 12-4
[OCF resource operation timedout]
pattern_start=crmd,ERROR:,process_lrm_event:,LRM operation,start,!status=,Timed Out
pattern_stop=crmd,ERROR:,process_lrm_event:,LRM operation,stop,!status=,Timed Out
pattern_monitor=crmd,ERROR:,process_lrm_event:,LRM operation,monitor,!monitor_0,!status=,Timed Out
pattern_promote=crmd,ERROR:,process_lrm_event,LRM operation,promote,!status=,Timed Out
pattern_demote=crmd,ERROR:,process_lrm_event,LRM operation,demote,!status=,Timed Out
pattern_migrate_to=crmd,ERROR:,process_lrm_event,LRM operation,migrate_to,!status=,Timed Out
pattern_migrate_from=crmd,ERROR:,process_lrm_event,LRM operation,migrate_from,!status=,Timed Out
func=operation_timedout_ocf
#MsgNo.3-2, 19-2
[Resource failure]
pattern_monitor_rcs=crmd,info:,process_lrm_event:,LRM operation,monitor,!monitor_0,rc=7,!status=
pattern_monitor_stonith=crmd,info:,process_lrm_event:,LRM operation,monitor,!monitor_0,rc=7,!status=
func=detect_rsc_failure
loglevel=ERROR
###
# For Node status event.
##
#MsgNo.6-1, 6-2
[Node status updated]
pattern_dead=crmd,notice:,crmd_ha_status_callback:,Status update:,Node,now has status,dead
pattern_active=crmd,notice:,crmd_ha_status_callback:,Status update:,Node,now has status,active
func=node_status_updated
#Msg No.6-3
[Node status determined]
pattern=pengine,determine_online_status,Node,is
func=node_status_determined
###
# For Interconnect-LAN status event
# and Network status event (detected by pingd).
###
#MsgNo.7-1
[Interconnect-LAN status dead]
pattern=heartbeat,info:,Link,dead
func=detect_iconnlan_dead
loglevel=WARN
#Msg No.7-2
[Interconnect-LAN or Network status up]
pattern=heartbeat,info:,Link,up
func=detect_network_up
#MsgNo.8-1
[Network status dead]
pattern=pingd,info:,stand_alone_ping:,is unreachable
func=detect_node_dead
loglevel=ERROR
###
# For Disk status event (detected by diskd).
###
#MsgNo.9-1
[Detect disk error]
pattern=diskd,WARN:,check_status:,disk status is changed,new_status,ERROR
func=detect_disk_error
loglevel=ERROR
###
# For respawn process event.
###
#MsgNo.10-1
[Respawn process starts]
pattern=heartbeat,info:,Starting,as,uid,gid
func=respawn_start
#MsgNo.10-2
[Respawn process exited abnormally]
pattern=heartbeat,Managed,process,exited with return code
func=respawn_exited_abnormally
loglevel=WARN
#MsgNo.10-3
[Respawn process killed]
pattern=heartbeat,WARN:,Managed,process,killed by signal
func=respawn_killed
#MsgNo.10-4
[Respawn process dumped core]
pattern=heartbeat,ERROR:,Managed,process,dumped core
func=respawn_dumped_core
loglevel=WARN
#MsgNo.10-5
[Respawn process went away]
pattern=heartbeat,ERROR:,Managed,process,went away strangely
func=respawn_went_away
loglevel=WARN
#MsgNo.10-6
[Respawn process exited normally]
pattern=heartbeat,info:,killing,process group,with signal
func=respawn_exited_normally
#MsgNo.10-7
[Respawning too fast in a short term]
pattern=heartbeat,ERROR:,Client,respawning too fast
func=respawn_too_fast
###
# For Fail Over. These are only for DC node.
##
#MsgNo.F0-1, F9-1, F10-1
[Detect calculation starts]
pattern=crmd,info:,do_state_transition:,State transition,S_IDLE -> S_POLICY_ENGINE,!I_SHUTDOWN
func=detect_pe_calc
loglevel=WARN
#MsgNo.F0-2, F12-1, F12-2
[FailOver complete]
pattern_idle=crmd,info:,do_state_transition:,State transition,-> S_IDLE
pattern_stopping=crmd,info:,do_state_transition:,State transition,-> S_STOPPING
func=detect_fo_complete
loglevel=WARN
#MsgNo.F1-1, F1-2, F2-1, F2-2, F3-1, F3-2, F4-1, F4-2, F6-1, F6-2
[Action failure]
pattern=crmd,WARN:,update_failcount:,Updating failcount for
func=dc_detect_failure
loglevel=WARN
fotrigger=1
#MsgNo.F7-1, F7-2, F7-3, F7-4, F8-1
[Node failure]
pattern_shut=crmd,WARN:,match_down_event:,No match for shutdown action on
func=dc_detect_node_failure
fotrigger=3
#MsgNo.F11-1
#The message is not output immediately, output when F/O is complete.
[Add Resource start action]
pattern=pengine,notice:,LogActions: Start
func=add_rsc_start
#MsgNo.F11-2
#The message is not output immediately, output when F/O is complete.
[Add Resource stop action]
pattern=pengine,notice:,LogActions: Stop
func=add_rsc_stop
#MsgNo.F11-3, F11-4, F11-8, F11-9
#The message is not output immediately, output when F/O is complete.
[Add no action]
pattern_leave_start=pengine,notice:,LogActions: Leave
pattern_recover=pengine,notice:,LogActions: Recover
pattern_restart=pengine,notice:,LogActions: Restart
func=add_no_action
#MsgNo.F11-5
#The message is not output immediately, output when F/O is complete.
[Detect resource unmanaged]
pattern=pengine,info:,native_color:,Unmanaged resource,allocated to
func=detect_rsc_unmanaged
#MsgNo.F11-6
#The message is not output immediately, output when F/O is complete.
[Add Resource move action]
pattern=pengine,notice:,LogActions: Move
func=add_rsc_move
#Msg No.F11-10
#The message is not output immediately, output when F/O is complete.
[Resource initiating action]
pattern=crmd,info:,te_rsc_command:,Initiating action,!probe_complete
func=rsc_init_action
###
# For DC election.
###
#Msg No.13-2
[DC election is complete]
pattern=crmd,info:,update_dc:,Set DC to
func=dc_election_complete
#Msg No.13-5
[Detect unset DC]
pattern=crmd,info:,update_dc:,Unset DC
func=detect_unset_dc
###
# For Corosync service shutdown.
###
#Msg No.14-1 (only for DC)
[Corosync on the node in the cluster want to shutdown]
pattern=crmd,info:,handle_shutdown_request:,Creating shutdown request for
func=detect_shutdown_request
#Msg No.14-2
[Heartbeat shutdown complete.]
pattern=heartbeat,info:,Heartbeat shutdown complete
func=detect_hb_shutdown
#Msg No.14-3
[Pacemaker is shutting down.]
pattern=crmd,info:,crm_shutdown: Requesting shutdown
func=detect_pcmk_shutting_down
#Msg No.14-4 (for DC node shutdown)
[DC node want to shutdown]
pattern=cib,info:,cib_process_shutdown_req:,Shutdown REQ from
func=detect_dc_shutdown_request
###
# For logging daemon event.
###
#Msg No.15-1
[Detect logd started]
pattern=logd,info:,logd started with
func=output_original_log
#Msg No.16-1
[logd is shutting down.]
pattern=logd,info:,logd_term_write_action:,received
func=output_static_msg
#Msg No.16-2
[logd stopped.]
pattern=logd,info:,Exiting write process
func=output_static_msg
###
# For STONITH resource operation timed out.
###
#For Msg No.17-4, 19-3
#The message is not output immediately, output when operation complete.
[Resource operation timed out for stonith]
pattern=stonithd,WARN:,process,timed out,try,Killing with signal
func=detect_rscop_timedout_stonithd
###
# For fence operation.
###
#Msg No.20-1, No21-1
[fence operation start]
pattern=stonithd,info:,stonith_operate_locally,sending fencing op,for,to
func=fence_op_started
#Msg No.20-2
[fence operation succeeded]
pattern=stonithd,info:,Succeeded to STONITH the node
func=fence_op_succeeded
#Msg No.20-3, 21-3
[fence operation failed]
pattern=stonithd,info:,failed to STONITH node,with local device
func=fence_op_failed
loglevel=ERROR
#Msg No.20-4, 21-4
[fence operation timedout]
pattern=stonithd,ERROR:,Failed to STONITH the node,optype,op_result,TIMEOUT
func=fence_op_timedout
###
# For attribute event.
###
#Msg No.22-1
[Detect attribute updated]
pattern=attrd,info:,attrd_perform_update:,Sent update,!fail-count-,!last-failure-,!probe_complete,!shutdown,!master-
func=detect_attr_updated
#Msg No.22-2
[Detect attribute deleted]
pattern=attrd,info:,attrd_perform_update:,Sent delete,!delete -,!fail-count-,!last-failure-,!probe_complete,!shutdown,!master-
func=detect_attr_deleted
#Msg No.22-3
[Detect cib updated]
pattern=crmd,info:,abort_transition_graph:,tag=nvpair,Transient attribute: update
func=detect_cib_updated
###
# For Heartbeat service starts.
###
#Msg No.23-1
[Detect heartbeat is starting]
pattern=heartbeat,info:,Configuration validated,Starting heartbeat
func=detect_hb_start
#Msg No.23-3
#It's just for clear ConvertStatus. Output nothing.
[Detect localhost status is set to up]
pattern=heartbeat,info:,Local status now set to,up
func=detect_localstat_up
ignoremsg=True
###
# For log message dropping.
###
#Msg No.25-1
[Detect log dropped]
pattern=ERROR:,cl_log:,messages were dropped
func=output_original_log
###
# For Core process event.
###
#Msg No.28-1
[FIFO process start to restart]
pattern=heartbeat,WARN:,Restarting,process
func=output_original_log
#Msg No.28-2
[FIFO process restart failed]
pattern=heartbeat,ERROR:,restart failed,Restarting heartbeat
func=output_original_log
#Msg No.28-3
[I/O processes failed]
pattern=heartbeat,ERROR:,process died,Beginning communications restart process for comm channel
func=output_original_log
loglevel=WARN
#Msg No.28-4
[I/O processes start to restart]
pattern=heartbeat,ERROR:,Both comm processes for channel,have died,Restarting
func=output_original_log
loglevel=WARN
#Msg No.28-5
[I/O processes restart succeeded]
pattern=heartbeat,info:,Communications restart succeeded
func=output_original_log
#Msg No.28-6
[I/O processes failed to restart]
pattern=heartbeat,ERROR:,Communications restart failed,Will try again later
func=output_original_log
###
# For pengine event.
###
#Msg No.29-1
[pengine start]
pattern=crmd,info:,start_subsystem:,Starting sub-system
func=crmd_subsystem_start
#Msg No.29-2
[pengine exit]
pattern=crmd,info:,crmdManagedChildDied:,Process,exited \(signal=0,exitcode=
func=crmd_subsystem_exit
#Msg No.29-3
[pengine kill]
pattern=crmd,info:,crmdManagedChildDied:,Process,exited \(signal=,exitcode=,!\(signal=0
func=crmd_subsystem_kill
loglevel=ERROR
###
# Other process's failure
###
#Msg No.30-1
[master control process failure]
pattern=heartbeat,CRIT:,Emergency Shutdown:,Master Control process died
func=output_original_log
loglevel=ERROR
#Msg No.30-2
[OS reboot because of process's failure]
pattern=heartbeat,EMERG:,Rebooting system,Reason:
func=output_original_log
loglevel=ERROR
###
# Others.
###
#Msg No.27-1
[Detect a request for getting DC node state]
pattern=crmd,info:,handle_request:,Current ping state:
func=detect_dcstat_req
ignoremsg=True