[Linux-cluster] rgmanager running, but cluster acts as if it's not

Ofer Inbar cos at aaaaa.org
Thu Aug 18 13:54:28 UTC 2011


[ cman-2.0.115-34, rgmanager-2.0.52-6, running on 5.5 ]

3-node cluster.  rgmanager is running on all three nodes, but service
won't relocate over to node 3.  clustat doesn't see rgmanager on it.
Run from nodes 1 and 2, clustat shows all three nodes Online but only
nodes 1 and 2 have rgmanager.  Run from node 3, clustat shows all
three Online and no rgmanager.  This is what I'd see if rgmanager were
not running on node3 at all.  And yet:

$ sudo /etc/init.d/rgmanager status
clurgmgrd (pid  2592) is running...
$ echo $?
0
$ ps aux | grep clu
root      2412  0.0  0.0  51920  1788 ?        S<sl 09:10   0:00 modclusterd
root      2592  0.0  0.0  23536  5132 ?        S<Ls 09:11   0:00 clurgmgrd
root      2593  0.0  0.0  23536   500 ?        S<   09:11   0:00 clurgmgrd

Restarting rgmanager succeeds but things are in the same broken state.

Nothing seems wrong in /var/log/messages:
Aug 18 08:54:07 node3 kernel: dlm: Using TCP for communications
Aug 18 08:54:08 node3 kernel: dlm: connecting to 2
Aug 18 08:54:08 node3 kernel: dlm: connecting to 1
Aug 18 08:54:08 node3 kernel: dlm: got connection from 1
Aug 18 08:54:08 node3 kernel: dlm: got connection from 2

However, strace shows process 2593 (the second clurgmgrd) in a nonstop
loop of SIGCHLD, rt_sigaction, rt_sigprocmask, clone, wait4.  That is
not what clurgmgrd processes on the other nodes look like.


Next, I tried fencing the node.  It shut down, rebooted, came back up,
rejoined the cluster, started rgmanager... and is *still* in this same
bad state!

I'm attaching lsof output for both clurgmgrd processes, and a sample
of the strace from the second process.  It looks the same after
fencing as it did before.

Any ideas?
  -- Cos
-------------- next part --------------
Aug 18 08:54:07 node3 kernel: dlm: Using TCP for communications
Aug 18 08:54:08 node3 kernel: dlm: connecting to 2
Aug 18 08:54:08 node3 kernel: dlm: connecting to 1
Aug 18 08:54:08 node3 kernel: dlm: got connection from 1
Aug 18 08:54:08 node3 kernel: dlm: got connection from 2

$ sudo lsof -p 19330
COMMAND     PID USER   FD   TYPE DEVICE    SIZE    NODE NAME
clurgmgrd 19330 root  cwd    DIR  253,0    4096       2 /
clurgmgrd 19330 root  rtd    DIR  253,0    4096       2 /
clurgmgrd 19330 root  txt    REG  253,0  258408 1706604 /usr/sbin/clurgmgrd
clurgmgrd 19330 root  mem    REG  253,0  139416 1882071 /lib64/ld-2.5.so
clurgmgrd 19330 root  mem    REG  253,0 1717800 1882072 /lib64/libc-2.5.so
clurgmgrd 19330 root  mem    REG  253,0  615136 1882073 /lib64/libm-2.5.so
clurgmgrd 19330 root  mem    REG  253,0   23360 1882075 /lib64/libdl-2.5.so
clurgmgrd 19330 root  mem    REG  253,0  145824 1882074 /lib64/libpthread-2.5.so
clurgmgrd 19330 root  mem    REG  253,0   85608 1695743 /usr/lib64/libz.so.1.2.3
clurgmgrd 19330 root  mem    REG  253,0   22136 1706606 /usr/lib64/libcman.so.2.0.115
clurgmgrd 19330 root  mem    REG  253,0 1297104 1706630 /usr/lib64/libxml2.so.2.6.26
clurgmgrd 19330 root  mem    REG  253,0   23576 1706612 /usr/lib64/libdlm.so.2.0.115
clurgmgrd 19330 root  mem    REG  253,0  902744 1706540 /usr/lib64/libslang.so.2.0.6
clurgmgrd 19330 root    0u   CHR    1,3            1275 /dev/null
clurgmgrd 19330 root    1u   CHR    1,3            1275 /dev/null
clurgmgrd 19330 root    2u   CHR    1,3            1275 /dev/null

$ sudo lsof -p 19331
COMMAND     PID USER   FD   TYPE             DEVICE    SIZE     NODE NAME
clurgmgrd 19331 root  cwd    DIR              253,0    4096        2 /
clurgmgrd 19331 root  rtd    DIR              253,0    4096        2 /
clurgmgrd 19331 root  txt    REG              253,0  258408  1706604 /usr/sbin/clurgmgrd
clurgmgrd 19331 root  mem    REG              253,0  139416  1882071 /lib64/ld-2.5.so
clurgmgrd 19331 root  mem    REG              253,0 1717800  1882072 /lib64/libc-2.5.so
clurgmgrd 19331 root  mem    REG              253,0  615136  1882073 /lib64/libm-2.5.so
clurgmgrd 19331 root  mem    REG              253,0   23360  1882075 /lib64/libdl-2.5.so
clurgmgrd 19331 root  mem    REG              253,0  145824  1882074 /lib64/libpthread-2.5.so
clurgmgrd 19331 root  mem    REG              253,0   85608  1695743 /usr/lib64/libz.so.1.2.3
clurgmgrd 19331 root  mem    REG              253,0   22136  1706606 /usr/lib64/libcman.so.2.0.115
clurgmgrd 19331 root  mem    REG              253,0 1297104  1706630 /usr/lib64/libxml2.so.2.6.26
clurgmgrd 19331 root  mem    REG              253,0   23576  1706612 /usr/lib64/libdlm.so.2.0.115
clurgmgrd 19331 root  mem    REG              253,0  902744  1706540 /usr/lib64/libslang.so.2.0.6
clurgmgrd 19331 root    0u   CHR                1,3             1275 /dev/null
clurgmgrd 19331 root    1u   CHR                1,3             1275 /dev/null
clurgmgrd 19331 root    2u   CHR                1,3             1275 /dev/null
clurgmgrd 19331 root    3u  unix 0xffff810174227140         31164635 socket
clurgmgrd 19331 root    4r   CHR                1,5             1277 /dev/zero
clurgmgrd 19331 root    5r  FIFO                0,6         31164637 pipe
clurgmgrd 19331 root    6w  FIFO                0,6         31164637 pipe
clurgmgrd 19331 root    7u   CHR              10,62             6413 /dev/misc/dlm-control
clurgmgrd 19331 root    8u   CHR              10,58         31164700 /dev/misc/dlm_rgmanager

$ sudo strace -p 19331
Process 19331 attached - interrupt to quit
restart_syscall(<... resuming interrupted call ...>) = 0
rt_sigaction(SIGINT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigaction(SIGQUIT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
clone(child_stack=0, flags=CLONE_PARENT_SETTID|SIGCHLD, parent_tidptr=0x7fff59f75318) = 24090
wait4(24090, [{WIFEXITED(s) && WEXITSTATUS(s) == 1}], 0, NULL) = 24090
rt_sigaction(SIGINT, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigaction(SIGQUIT, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
rt_sigaction(SIGCHLD, NULL, {SIG_DFL, [], 0}, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
nanosleep({1, 0}, {1, 0})               = 0
rt_sigaction(SIGINT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigaction(SIGQUIT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
clone(child_stack=0, flags=CLONE_PARENT_SETTID|SIGCHLD, parent_tidptr=0x7fff59f75318) = 24093
wait4(24093, [{WIFEXITED(s) && WEXITSTATUS(s) == 1}], 0, NULL) = 24093
rt_sigaction(SIGINT, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigaction(SIGQUIT, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
rt_sigaction(SIGCHLD, NULL, {SIG_DFL, [], 0}, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
nanosleep({1, 0}, {1, 0})               = 0
rt_sigaction(SIGINT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigaction(SIGQUIT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
clone(child_stack=0, flags=CLONE_PARENT_SETTID|SIGCHLD, parent_tidptr=0x7fff59f75318) = 24095
wait4(24095, [{WIFEXITED(s) && WEXITSTATUS(s) == 1}], 0, NULL) = 24095
rt_sigaction(SIGINT, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigaction(SIGQUIT, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
--- SIGCHLD (Child exited) @ 0 (0) ---
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
rt_sigaction(SIGCHLD, NULL, {SIG_DFL, [], 0}, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
nanosleep({1, 0}, {1, 0})               = 0
rt_sigaction(SIGINT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigaction(SIGQUIT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
clone(child_stack=0, flags=CLONE_PARENT_SETTID|SIGCHLD, parent_tidptr=0x7fff59f75318) = 24097
wait4(24097, [{WIFEXITED(s) && WEXITSTATUS(s) == 1}], 0, NULL) = 24097
rt_sigaction(SIGINT, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigaction(SIGQUIT, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
rt_sigaction(SIGCHLD, NULL, {SIG_DFL, [], 0}, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
nanosleep({1, 0}, {1, 0})               = 0
rt_sigaction(SIGINT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigaction(SIGQUIT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
clone(child_stack=0, flags=CLONE_PARENT_SETTID|SIGCHLD, parent_tidptr=0x7fff59f75318) = 24099
wait4(24099, [{WIFEXITED(s) && WEXITSTATUS(s) == 1}], 0, NULL) = 24099
rt_sigaction(SIGINT, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigaction(SIGQUIT, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
rt_sigaction(SIGCHLD, NULL, {SIG_DFL, [], 0}, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
nanosleep({1, 0}, {1, 0})               = 0
rt_sigaction(SIGINT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigaction(SIGQUIT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
clone(child_stack=0, flags=CLONE_PARENT_SETTID|SIGCHLD, parent_tidptr=0x7fff59f75318) = 24101
wait4(24101, [{WIFEXITED(s) && WEXITSTATUS(s) == 1}], 0, NULL) = 24101
rt_sigaction(SIGINT, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigaction(SIGQUIT, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
rt_sigaction(SIGCHLD, NULL, {SIG_DFL, [], 0}, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
nanosleep({1, 0}, {1, 0})               = 0
rt_sigaction(SIGINT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigaction(SIGQUIT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
clone(child_stack=0, flags=CLONE_PARENT_SETTID|SIGCHLD, parent_tidptr=0x7fff59f75318) = 24104
wait4(24104, [{WIFEXITED(s) && WEXITSTATUS(s) == 1}], 0, NULL) = 24104
rt_sigaction(SIGINT, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigaction(SIGQUIT, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
rt_sigaction(SIGCHLD, NULL, {SIG_DFL, [], 0}, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
nanosleep({1, 0}, {1, 0})               = 0
rt_sigaction(SIGINT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigaction(SIGQUIT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
clone(child_stack=0, flags=CLONE_PARENT_SETTID|SIGCHLD, parent_tidptr=0x7fff59f75318) = 24106
wait4(24106, [{WIFEXITED(s) && WEXITSTATUS(s) == 1}], 0, NULL) = 24106
rt_sigaction(SIGINT, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigaction(SIGQUIT, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
rt_sigaction(SIGCHLD, NULL, {SIG_DFL, [], 0}, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
nanosleep({1, 0}, {1, 0})               = 0
rt_sigaction(SIGINT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigaction(SIGQUIT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
clone(child_stack=0, flags=CLONE_PARENT_SETTID|SIGCHLD, parent_tidptr=0x7fff59f75318) = 24108
wait4(24108, [{WIFEXITED(s) && WEXITSTATUS(s) == 1}], 0, NULL) = 24108
rt_sigaction(SIGINT, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigaction(SIGQUIT, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
rt_sigaction(SIGCHLD, NULL, {SIG_DFL, [], 0}, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
nanosleep({1, 0}, {1, 0})               = 0
rt_sigaction(SIGINT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigaction(SIGQUIT, {0x1, [], SA_RESTORER, 0x301ce302d0}, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, 8) = 0
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
clone(child_stack=0, flags=CLONE_PARENT_SETTID|SIGCHLD, parent_tidptr=0x7fff59f75318) = 24116
wait4(24116, [{WIFEXITED(s) && WEXITSTATUS(s) == 1}], 0, NULL) = 24116
rt_sigaction(SIGINT, {0x40c46c, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigaction(SIGQUIT, {SIG_DFL, [], SA_RESTORER, 0x301ce302d0}, NULL, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
rt_sigprocmask(SIG_BLOCK, [CHLD], ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], 8) = 0
rt_sigaction(SIGCHLD, NULL, {SIG_DFL, [], 0}, 8) = 0
rt_sigprocmask(SIG_SETMASK, ~[INT QUIT ILL TRAP ABRT BUS FPE KILL USR1 SEGV PIPE TERM CHLD STOP RTMIN RT_1], NULL, 8) = 0
nanosleep({1, 0},


More information about the Linux-cluster mailing list