Hi,
We have a two-node cluster with a manual fencing configuration. One of the nodes died because of a hardware issue, and we removed the dead node from the cluster using the following commands:
fence_manual -n db2.example.com
fence_ack_manual -n db2.example.com
The faulty node has now been recovered and we need to add it back to the cluster. We are trying to add the node using the luci interface, but when we use "Add a node" in luci, the addition fails with the error "that node is already a part of the cluster". However, the node name is not present in the cluster.conf file.
===
cat /etc/cluster/cluster.conf
<?xml version="1.0"?>
<cluster alias="db" config_version="31" name="db">
<fence_daemon clean_start="0" post_fail_delay="0" post_join_delay="3"/>
<clusternodes>
<clusternode name="db1.example.com" nodeid="1" votes="1">
<fence/>
</clusternode>
</clusternodes>
<cman/>
<fencedevices/>
<rm>
<failoverdomains>
<failoverdomain name="DBFA-DM" nofailback="0" ordered="0" restricted="1">
<failoverdomainnode name="db1.example.com" priority="1"/>
</failoverdomain>
</failoverdomains>
<resources>
<postgres-8 config_file="/var/lib/pgsql/data/postgresql.conf" name="psql" postmaster_user="postgres" shutdown_wait="0"/>
<ip address="192.168.2.173" monitor_link="1"/>
<clusterfs device="/dev/db/dbgfs" force_unmount="1" fsid="48393" fstype="gfs" mountpoint="/var/lib/pgsql/" name="DB" self_fence="1"/>
<script file="/etc/init.d/postgresql" name="psql-db"/>
</resources>
<service autostart="1" domain="DBFA-DM" exclusive="1" name="DB" recovery="relocate">
<ip ref="192.168.2.173"/>
<clusterfs fstype="gfs" ref="DB"/>
<script ref="psql-db"/>
</service>
</rm>
<totem consensus="4800" join="60" token="10000" token_retransmits_before_loss_const="20"/>
</cluster>
====
<?xml version="1.0"?>
<cluster alias="db" config_version="31" name="db">
<fence_daemon clean_start="0" post_fail_delay="0" post_join_delay="3"/>
<clusternodes>
<clusternode name="db1.example.com" nodeid="1" votes="1">
<fence/>
</clusternode>
</clusternodes>
<cman/>
<fencedevices/>
<rm>
<failoverdomains>
<failoverdomain name="DBFA-DM" nofailback="0" ordered="0" restricted="1">
<failoverdomainnode name="db1.example.com" priority="1"/>
</failoverdomain>
</failoverdomains>
<resources>
<postgres-8 config_file="/var/lib/pgsql/data/postgresql.conf" name="psql" postmaster_user="postgres" shutdown_wait="0"/>
<ip address="192.168.2.173" monitor_link="1"/>
<clusterfs device="/dev/db/dbgfs" force_unmount="1" fsid="48393" fstype="gfs" mountpoint="/var/lib/pgsql/" name="DB" self_fence="1"/>
<script file="/etc/init.d/postgresql" name="psql-db"/>
</resources>
<service autostart="1" domain="DBFA-DM" exclusive="1" name="DB" recovery="relocate">
<ip ref="192.168.2.173"/>
<clusterfs fstype="gfs" ref="DB"/>
<script ref="psql-db"/>
</service>
</rm>
<totem consensus="4800" join="60" token="10000" token_retransmits_before_loss_const="20"/>
</cluster>
====
Please suggest how to resolve this issue.
Thanks
Zaman
-- Linux-cluster mailing list Linux-cluster@xxxxxxxxxx https://www.redhat.com/mailman/listinfo/linux-cluster