These are the log messages related to restarting Oracle. To simulate Oracle problems I killed pmon and removed initSCAPA1.ora; after that it gets into this loop, executing oracledb.sh over and over. Perhaps there's a parameter I'm missing in cluster.conf? (It's pasted after the log.) Mar 18 15:52:05 dc1-x6250-a oracledb.sh: Restarting Oracle Database... Mar 18 15:52:05 dc1-x6250-a cat: Mar 18 15:52:05 dc1-x6250-a cat: SQL*Plus: Release 11.1.0.7.0 - Production on Thu Mar 18 15:52:05 2010 Mar 18 15:52:05 dc1-x6250-a cat: Mar 18 15:52:05 dc1-x6250-a cat: Copyright (c) 1982, 2008, Oracle. All rights reserved. Mar 18 15:52:05 dc1-x6250-a cat: Mar 18 15:52:05 dc1-x6250-a cat: Connected to an idle instance. Mar 18 15:52:05 dc1-x6250-a cat: Mar 18 15:52:05 dc1-x6250-a cat: SQL> ORACLE instance shut down. Mar 18 15:52:05 dc1-x6250-a cat: SQL> Disconnected Mar 18 15:52:05 dc1-x6250-a cat: Mar 18 15:52:05 dc1-x6250-a cat: SQL*Plus: Release 11.1.0.7.0 - Production on Thu Mar 18 15:52:05 2010 Mar 18 15:52:05 dc1-x6250-a cat: Mar 18 15:52:05 dc1-x6250-a cat: Copyright (c) 1982, 2008, Oracle. All rights reserved. Mar 18 15:52:05 dc1-x6250-a cat: Mar 18 15:52:05 dc1-x6250-a cat: Connected to an idle instance. Mar 18 15:52:05 dc1-x6250-a cat: Mar 18 15:52:05 dc1-x6250-a cat: SQL> ORA-01078: failure in processing system parameters Mar 18 15:52:05 dc1-x6250-a cat: LRM-00109: could not open parameter file 'initSCAPA1.ora' Mar 18 15:52:05 dc1-x6250-a cat: SQL> Disconnected Mar 18 15:52:35 dc1-x6250-a oracledb.sh: Restarting Oracle Database... 
cluster.conf <?xml version="1.0"?> <cluster alias="oracle_prod" config_version="40" name="oracle_prod"> <fence_daemon clean_start="1" post_fail_delay="100" post_join_delay="-1"/> <clusternodes> <clusternode name="dc2-x6250-a-cl.lux.eib.org" nodeid="1" votes="1"> <fence> <method name="1"> <device name="fence_dc2-x6250-a"/> </method> </fence> </clusternode> <clusternode name="dc1-x6250-a-cl.lux.eib.org" nodeid="2" votes="1"> <fence> <method name="1"> <device name="fence_dc1-x6250-a"/> </method> </fence> </clusternode> </clusternodes> <cman expected_votes="2" two_node="0"/> <fencedevices> <fencedevice agent="fence_ipmilan" ipaddr="172.26.240.3" login="root" name="fence_dc1-x6250-a" passwd="no7+WaYs"/> <fencedevice agent="fence_ipmilan" ipaddr="172.26.240.4" login="root" name="fence_dc2-x6250-a" passwd="no7+WaYs"/> </fencedevices> <rm> <failoverdomains> <failoverdomain name="scapa_failover_domain" nofailback="0" ordered="0" restricted="1"> <failoverdomainnode name="dc2-x6250-a-cl.lux.eib.org" priority="1"/> <failoverdomainnode name="dc1-x6250-a-cl.lux.eib.org" priority="1"/> </failoverdomain> <failoverdomain name="jura_failover_domain" nofailback="0" ordered="1" restricted="1"> <failoverdomainnode name="dc2-x6250-a-cl.lux.eib.org" priority="1"/> <failoverdomainnode name="dc1-x6250-a-cl.lux.eib.org" priority="2"/> </failoverdomain> </failoverdomains> <resources> <lvm lv_name="" name="scapa_resource" vg_name="vg_ora_scapa"/> <fs device="/dev/vg_ora_scapa/lv_ora_scapa_arch" force_fsck="0" force_unmount="0" fsid="2069" fstype="ext3" mountpoint="/app/oracle/scapa/archive" name="ora_scapa_arch" self_fence="0"/> <fs device="/dev/vg_ora_scapa/lv_ora_scapa_redo" force_fsck="0" force_unmount="0" fsid="2070" fstype="ext3" mountpoint="/app/oracle/scapa/redo" name="ora_scapa_redo" self_fence="0"/> <fs device="/dev/vg_ora_scapa/lv_ora_scapa_data" force_fsck="0" force_unmount="0" fsid="2071" fstype="ext3" mountpoint="/app/oracle/scapa/data" name="ora_scapa_data" self_fence="0"/> <fs 
device="/dev/vg_ora_scapa/lv_ora_scapa_export" force_fsck="0" force_unmount="0" fsid="2072" fstype="ext3" mountpoint="/app/oracle/scapa/export" name="ora_scapa_export" self_fence="0"/> <lvm lv_name="" name="jura_resource" vg_name="vg_ora_jura"/> <fs device="/dev/vg_ora_jura/lv_ora_jura_arch" force_fsck="0" force_unmount="0" fsid="2073" fstype="ext3" mountpoint="/app/oracle/jura/archive" name="ora_jura_arch" self_fence="0"/> <fs device="/dev/vg_ora_jura/lv_ora_jura_redo" force_fsck="0" force_unmount="0" fsid="2074" fstype="ext3" mountpoint="/app/oracle/jura/redo" name="ora_jura_redo" self_fence="0"/> <fs device="/dev/vg_ora_jura/lv_ora_jura_data" force_fsck="0" force_unmount="0" fsid="2075" fstype="ext3" mountpoint="/app/oracle/jura/data" name="ora_jura_data" self_fence="0"/> <fs device="/dev/vg_ora_jura/lv_ora_jura_export" force_fsck="0" force_unmount="0" fsid="2076" fstype="ext3" mountpoint="/app/oracle/jura/export" name="ora_jura_export" self_fence="0"/> <ip address="172.26.18.35" monitor_link="1"/> <ip address="172.26.18.37" monitor_link="1"/> <oracledb home="/app/oracle/u02/product/11.1.0.7" listener_name="listener_JURA1" name="JURA1" type="base" user="oracle"/> <oracledb home="/app/oracle/u02/product/11.1.0.7" listener_name="listener_SCAPA1" name="SCAPA1" type="base" user="oracle"/> </resources> <service autostart="0" domain="scapa_failover_domain" exclusive="0" name="scapa" recovery="relocate"> <ip ref="172.26.18.35"> <lvm ref="scapa_resource"> <fs ref="ora_scapa_arch"/> <fs ref="ora_scapa_redo"/> <fs ref="ora_scapa_data"/> <fs ref="ora_scapa_export"/> <oracledb ref="SCAPA1"/> </lvm> </ip> </service> <service autostart="1" domain="jura_failover_domain" exclusive="0" name="jura" recovery="relocate"> <ip ref="172.26.18.37"> <lvm ref="jura_resource"> <fs ref="ora_jura_arch"/> <fs ref="ora_jura_redo"/> <fs ref="ora_jura_data"/> <fs ref="ora_jura_export"/> <oracledb ref="JURA1"/> </lvm> </ip> </service> </rm> <totem consensus="4800" join="60" token="15000" 
token_retransmits_before_loss_const="20"/> <quorumd interval="2" label="OracleQuorum" tko="20" upgrade_wait="2" master_wait="2" votes="1" log_level="7" min_score="1" reboot="0" allow_kill="0" stop_cman="0" status_file="/tmp/QdiskStatus"> </quorumd> </cluster> > Could you post the full cluster.conf file, and the cluster logs in > /var/log/messages? > > > > > > -----Original Message----- > From: linux-cluster-bounces@xxxxxxxxxx > [mailto:linux-cluster-bounces@xxxxxxxxxx] On Behalf Of jose nuno neto > Sent: Thursday, March 18, 2010 6:14 PM > To: linux clustering > Subject: oracledb.sh > > Hello > > I'm setting up Oracle as a failover service (not RAC) on RHCS. > The setup seems OK; I can switch from one node to the other. > But now I'm simulating failures, and /usr/share/cluster/oracledb.sh > detects the failure but keeps trying to restart the service on the same node. > > To simulate a failure I killed pmon and removed a config file, initSID.ora. > > I don't have any special options for restarting the service: > > <service autostart="0" domain="scapa_failover_domain" exclusive="0" > name="scapa" recovery="relocate"> > > How can I set it so that it'll fail and relocate to the other node? > > Thanks > Jose > > -- > This message has been scanned for viruses and > dangerous content by MailScanner, and is > believed to be clean. > > -- > Linux-cluster mailing list > Linux-cluster@xxxxxxxxxx > https://www.redhat.com/mailman/listinfo/linux-cluster > > -- > Linux-cluster mailing list > Linux-cluster@xxxxxxxxxx > https://www.redhat.com/mailman/listinfo/linux-cluster > > -- > This message has been scanned for viruses and > dangerous content by MailScanner, and is > believed to be clean. > -- This message has been scanned for viruses and dangerous content by MailScanner, and is believed to be clean. -- Linux-cluster mailing list Linux-cluster@xxxxxxxxxx https://www.redhat.com/mailman/listinfo/linux-cluster