[Linux-HA] simple ip failover problem

Guochun Shi gshi at ncsa.uiuc.edu
Wed Oct 12 10:07:08 MDT 2005


One more thing: ipfail does not work with the 2.x version (yet),
so you need to remove ipfail from ha.cf.

-Guochun

At 10:34 AM 10/12/2005 -0500, you wrote:
>check out: 
>http://www.gossamer-threads.com/lists/linuxha/users/28207
>
>-Guochun
>
>At 03:12 PM 10/11/2005 +0200, you wrote:
>>Content-class: urn:content-classes:message
>>Content-Type: multipart/signed; protocol="application/x-pkcs7-signature";
>>        micalg=SHA1;
>>        boundary="=_pbote2.srv.dsh.at-2487-1129036352-0001-2"
>>
>>Hi!
>>We have been using heartbeat 1.x for several years now for our RedHat based
>>firewall distro.
>>I am trying to convert our current config to 2.x and am having problems doing so.
>>
>>Using IPaddr2 doesn't work, because I get the error:
>>Oct 11 14:46:30 hbtest1 lrmd: [6989]: ERROR: Process 6994 failed to redirect
>>stdout for its background child (daemon) processes. This will likely cause
>>those processes to die mysteriously at some later time (terminated by signal
>>SIGPIPE).
>>
>>When using IPaddr, I have to kill the process '/bin/sh 
>>/usr/lib/ocf/resource.d//heartbeat/IPaddr start' to be able to stop heartbeat, 
>>because it hangs.
>>
>>Here are my current config files:
>>
>>/etc/ha.d/ha.cf
>>
>>#logfacility    local0
>>#keepalive 2
>>#deadtime 10
>>#initdead 20
>># heartbeat communication-port
>>udpport         694
>># heartbeat communication.interface
>>#bcast          eth1
>>ucast           eth1    10.30.8.93
>>
>>auto_failback   on
>>
>>crm             yes
>>use_logd        on
>>
>>respawn         hacluster       /usr/lib/heartbeat/ipfail
>>ping            10.30.8.90
>>
>># heartbeat nodes
>>node            hbtest1.srv.dsh.at
>>node            hbtest2.srv.dsh.at
>>
>>
>>
>>/var/lib/heartbeat/crm/cib.xml:
>>
>><cib dc_uuid="bf4c20b8-6131-4c6d-8f10-3a512e012fa1" cib_feature_revision="1" 
>>admin_epoch="0" epoch="9" num_updates="109" have_quorum="true" 
>>last_written="Tue Oct 11 15:08:25 2005
>>" generated="true" num_peers="1" origin="hbtest1.srv.dsh.at" 
>>debug_source="finalize_join" ccm_transition="1">
>>   <configuration>
>>     <crm_config>
>>       <nvpair id="transition_idle_timeout" name="transition_idle_timeout" 
>>value="20s"/>
>>       <nvpair id="symmetric_cluster" name="symmetric_cluster" value="true"/>
>>       <nvpair id="stonith_enabled" name="stonith_enabled" value="false"/>
>>       <nvpair id="no_quorum_policy" name="no_quorum_policy" value="stop"/>
>>       <nvpair id="suppress_cib_writes" name="suppress_cib_writes" 
>>value="false"/>
>>       <nvpair id="default_resource_stickiness" 
>>name="default_resource_stickiness" value="INFINITY"/>
>>       <nvpair id="require_quorum" name="require_quorum" value="true"/>
>>     </crm_config>
>>     <nodes>
>>       <node id="bf4c20b8-6131-4c6d-8f10-3a512e012fa1" 
>>uname="hbtest1.srv.dsh.at" type="member"/>
>>     </nodes>
>>     <resources>
>>       <group id="group_1">
>>         <primitive id="IPaddr_1" class="ocf" type="IPaddr" 
>>provider="heartbeat">
>>           <operations>
>>             <op id="1" name="monitor" interval="5s" timeout="3s"/>
>>           </operations>
>>           <instance_attributes>
>>             <attributes>
>>               <nvpair id="1" name="ip" value="10.30.8.93"/>
>>             </attributes>
>>           </instance_attributes>
>>         </primitive>
>>       </group>
>>     </resources>
>>     <constraints>
>>       <rsc_location id="rsc_location_group_1" rsc="group_1">
>>         <rule id="prefered_location_group_1" score="100">
>>           <expression id="1" attribute="#uname" operation="eq" 
>>value="hbtest1.srv.dsh.at"/>
>>         </rule>
>>       </rsc_location>
>>     </constraints>
>>   </configuration>
>>   <status>
>>     <node_state id="bf4c20b8-6131-4c6d-8f10-3a512e012fa1" 
>>uname="hbtest1.srv.dsh.at" in_ccm="true" join="member" origin="do_lrm_query" 
>>crmd="online" ha="active" expected="member"
>>>
>>       <lrm>
>>         <lrm_resources>
>>           <lrm_resource id="group_1:IPaddr_1" last_op="stop" 
>>rsc_state="stopped" rc_code="0" op_status="0">
>>             <lrm_rsc_op id="group_1:IPaddr_1_start_0" operation="start" 
>>origin="do_update_resource" 
>>transition_key="0:68c9ef46-ab25-4479-8fc5-545f249c3535" 
>>transition_magic="0:0:68c9ef46-ab25-4479-8fc5-545f249c3535" rsc_state="running" call_id="2" 
>>rc_code="0" op_status="0"/>
>>             <lrm_rsc_op id="group_1:IPaddr_1_stop_0" operation="stop" 
>>origin="do_update_resource" 
>>transition_key="5:68c9ef46-ab25-4479-8fc5-545f249c3535" 
>>transition_magic="0:5:68c9ef46-ab25-4479-8fc5-545f249c3535" rsc_state="stopped" 
>>call_id="7" 
>>rc_code="0" op_status="0"/>
>>           </lrm_resource>
>>         </lrm_resources>
>>       </lrm>
>>     </node_state>
>>   </status>
>> </cib>
>>
>>
>>/var/log/cluster.log is attached.
>>
>>With best regards
>>Alexander Hartmaier
>>
>>T-Systems Austria GesmbH
>>Rennweg 97-99
>>A-1030 Vienna
>>
>>
>>
>>
>>_______________________________________________
>>Linux-HA mailing list
>>Linux-HA at lists.linux-ha.org
>>http://lists.linux-ha.org/mailman/listinfo/linux-ha
>>See also: http://linux-ha.org/ReportingProblems 
>
>_______________________________________________
>Linux-HA mailing list
>Linux-HA at lists.linux-ha.org
>http://lists.linux-ha.org/mailman/listinfo/linux-ha
>See also: http://linux-ha.org/ReportingProblems




More information about the Linux-HA mailing list