[Linux-cluster] DRAC5 fencing problem with Redhat 5.3 cluster

Dan Hayes dhayes501 at gmail.com
Wed Apr 22 17:00:30 UTC 2009


I have 8 Dell servers all loaded with Redhat 5.3.  The machines have an
external and internal IP address.  The cluster is configured on the internal
ip address.

The cluster appears to be working fine except for fencing.  When I try to
manually fence a node, I get a connection error:
[root@w002 ~]# fence_node lb001.domain.com
agent "fence_drac5" reports: Unable to connect/login to fencing device

I was able to get the fence_drac5 command to work directly by adding the
"-x" option for using SSH.  It says the connection times out, but it does
shut down the other machine:
[root@w002 ~]# fence_drac5 -a 165.289.178.221 -l root -p pass -x
lb001.domain.com
Connection timed out

Why does the connection time out?  And how do I add the "-x" option to the
cluster.conf file so that the fencing agent can connect?

Here are my /etc/hosts and /etc/cluster/cluster.conf files.

##############################################/etc/hosts
# Static name resolution for the eight servers: loopback, public (eth0),
# DRAC management cards, and the private cluster network (eth1).
127.0.0.1               localhost.localdomain localhost
::1             localhost6.localdomain6 localhost6

#eth0  --  p=public interface
# Names ending in "p" are the public-side names of each server.
# NOTE(review): the second octet (289) is not a valid IPv4 octet; presumably
# the addresses were anonymized for posting -- confirm against the real file.
165.289.178.111    w001p w001p.domain.com
165.289.178.112    w002p w002p.domain.com
165.289.178.113    w003p w003p.domain.com
165.289.178.121    lb001p lb001p.domain.com
165.289.178.122    lb002p lb002p.domain.com
165.289.178.124    db001p db001p.domain.com
165.289.178.125    db002p db002p.domain.com
165.289.178.126    dev001p dev001p.domain.com
# DRAC entries: each name and address matches the name/ipaddr of a
# fencedevice in /etc/cluster/cluster.conf. They sit in the same
# 165.289.178.x range as the public addresses, not on the 192.168.178.x
# cluster network.
165.289.178.211    w001-drac
165.289.178.212    w002-drac
165.289.178.213    w003-drac
165.289.178.221    lb001-drac
165.289.178.222    lb002-drac
165.289.178.224    db001-drac
165.289.178.225    db002-drac
165.289.178.226    dev001-drac

#eth1 --  this is the cluster
# The <name>.domain.com names below are the ones used as clusternode names
# in /etc/cluster/cluster.conf, so cluster traffic uses these addresses.
192.168.178.111    w001 w001.domain.com
192.168.178.112    w002 w002.domain.com
192.168.178.113    w003 w003.domain.com
192.168.178.121    lb001 lb001.domain.com
192.168.178.122    lb002 lb002.domain.com
192.168.178.124    db001 db001.domain.com
192.168.178.125    db002 db002.domain.com
192.168.178.126    dev001 dev001.domain.com
#########################################################



##################################/etc/cluster/cluster.conf
<?xml version="1.0"?>
<!--
  cluster.conf for the eight-node cluster "cluster1".

  Each clusternode has a single fence method ("1") that references, by name,
  one fencedevice in the fencedevices section; every fencedevice uses the
  fence_drac5 agent with the DRAC address and credentials given there.

  Every attribute value must be closed with a matching double quote. An
  unterminated value (for example a passwd value with no closing quote)
  makes the whole file ill-formed, and no XML parser can load it.

  NOTE(review): running fence_drac5 by hand only worked with the -x (SSH)
  flag. The cluster.conf equivalent is presumably secure="1" on each
  fencedevice; confirm against the fence_drac5 man page before adding it.

  NOTE(review): the ipaddr values contain an octet of 289, which is not a
  valid IPv4 octet; presumably anonymized for posting. Confirm the real
  addresses.
-->
<cluster alias="cluster1" config_version="1" name="cluster1">
        <fence_daemon post_fail_delay="0" post_join_delay="3"/>
        <clusternodes>
                <clusternode name="dev001.domain.com" nodeid="1" votes="1">
                        <fence>
                                <method name="1">
                                        <device name="dev001-drac"/>
                                </method>
                        </fence>
                </clusternode>
                <clusternode name="w001.domain.com" nodeid="2" votes="1">
                        <fence>
                                <method name="1">
                                        <device name="w001-drac"/>
                                </method>
                        </fence>
                </clusternode>
                <clusternode name="w002.domain.com" nodeid="3" votes="1">
                        <fence>
                                <method name="1">
                                        <device name="w002-drac"/>
                                </method>
                        </fence>
                </clusternode>
                <clusternode name="w003.domain.com" nodeid="4" votes="1">
                        <fence>
                                <method name="1">
                                        <device name="w003-drac"/>
                                </method>
                        </fence>
                </clusternode>
                <clusternode name="lb001.domain.com" nodeid="5" votes="1">
                        <fence>
                                <method name="1">
                                        <device name="lb001-drac"/>
                                </method>
                        </fence>
                </clusternode>
                <clusternode name="lb002.domain.com" nodeid="6" votes="1">
                        <fence>
                                <method name="1">
                                        <device name="lb002-drac"/>
                                </method>
                        </fence>
                </clusternode>
                <clusternode name="db001.domain.com" nodeid="7" votes="1">
                        <fence>
                                <method name="1">
                                        <device name="db001-drac"/>
                                </method>
                        </fence>
                </clusternode>
                <clusternode name="db002.domain.com" nodeid="8" votes="1">
                        <fence>
                                <method name="1">
                                        <device name="db002-drac"/>
                                </method>
                        </fence>
                </clusternode>
        </clusternodes>
        <cman/>
        <fencedevices>
                <fencedevice agent="fence_drac5" ipaddr="165.289.178.211"
                             login="root" name="w001-drac" passwd="pass"/>
                <fencedevice agent="fence_drac5" ipaddr="165.289.178.212"
                             login="root" name="w002-drac" passwd="pass"/>
                <fencedevice agent="fence_drac5" ipaddr="165.289.178.213"
                             login="root" name="w003-drac" passwd="pass"/>
                <fencedevice agent="fence_drac5" ipaddr="165.289.178.221"
                             login="root" name="lb001-drac" passwd="pass"/>
                <fencedevice agent="fence_drac5" ipaddr="165.289.178.222"
                             login="root" name="lb002-drac" passwd="pass"/>
                <fencedevice agent="fence_drac5" ipaddr="165.289.178.224"
                             login="root" name="db001-drac" passwd="pass"/>
                <fencedevice agent="fence_drac5" ipaddr="165.289.178.225"
                             login="root" name="db002-drac" passwd="pass"/>
                <fencedevice agent="fence_drac5" ipaddr="165.289.178.226"
                             login="root" name="dev001-drac" passwd="pass"/>
        </fencedevices>
        <rm/>
</cluster>
########################################################
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://listman.redhat.com/archives/linux-cluster/attachments/20090422/9783ed82/attachment.htm>


More information about the Linux-cluster mailing list