I forgot to mention the versions I used. <br>I used SLES11-SP1-HAE Beta5<br>Pacemaker 1.0.7<br>Corosync 1.2.0<br>Cluster Glue 1.0.3<br><br><br><div class="gmail_quote">2010/5/14 Javen Wu <span dir="ltr">&lt;<a href="mailto:wu.javen@gmail.com">wu.javen@gmail.com</a>&gt;</span><br>
<blockquote class="gmail_quote" style="margin: 0pt 0pt 0pt 0.8ex; border-left: 1px solid rgb(204, 204, 204); padding-left: 1ex;">Hi Folks,<br><br>I set up a three-node cluster with SBD STONITH configured.<br>After I manually isolated one node by running "ifconfig eth1 down" on it, the node was fenced as expected.<br>
But after the reboot, even though the network had recovered, the node was killed again as soon as I started openais and pacemaker.<br>
In `crm_mon -n` I saw the node's state change from OFFLINE to ONLINE before it was killed, and I saw its SBD slot go from reset->clear->reset.<br><br>I have attached the syslog and the corosync log.<br>My CIB configuration is very simple.<br>

<br>Could you help me find out what the problem is? As far as I understand, this is not the expected behaviour.<br><br>===%<====CIB information=====================<br><br><cib validate-with="pacemaker-1.0" crm_feature_set="3.0.1" have-quorum="1" admin_epoch="0" epoch="349" num_updates="99" cib-last-written="Fri May 14 14:50:21 2010" dc-uuid="vm209"><br>

  <configuration><br>    <crm_config><br>      <cluster_property_set id="cib-bootstrap-options"><br>        <nvpair id="cib-bootstrap-options-dc-version" name="dc-version" value="1.1.1-530add2a3721a0ecccb24660a97dbfdaa3e68f51"/><br>

        <nvpair id="cib-bootstrap-options-cluster-infrastructure" name="cluster-infrastructure" value="openais"/><br>        <nvpair id="cib-bootstrap-options-expected-quorum-votes" name="expected-quorum-votes" value="3"/><br>

      </cluster_property_set><br>    </crm_config><br>    <nodes><br>      <node id="vm208" uname="vm208" type="normal"/><br>      <node id="vm209" uname="vm209" type="normal"/><br>

      <node id="vm210" uname="vm210" type="normal"/><br>    </nodes><br>    <resources><br>      <clone id="Fencing"><br>        <primitive class="stonith" id="sbd-fencing" type="external/sbd"><br>

          <instance_attributes id="sbd-fencing-instance_attributes"><br>            <nvpair id="sbd-fencing-instance_attributes-sbd_device" name="sbd_device" value="/dev/sdc"/><br>

          </instance_attributes><br>          <operations><br>            <op id="sbd-fencing-monitor-20s" interval="20s" name="monitor"/><br>          </operations><br>

        </primitive><br>      </clone><br>    </resources><br>    <constraints/><br>    <rsc_defaults/><br>    <op_defaults/><br>  </configuration><br>  <status><br>    <node_state id="vm209" uname="vm209" ha="active" in_ccm="true" crmd="online" join="member" expected="member" crm-debug-origin="post_cache_update" shutdown="0"><br>

      <transient_attributes id="vm209"><br>        <instance_attributes id="status-vm209"><br>          <nvpair id="status-vm209-probe_complete" name="probe_complete" value="true"/><br>

        </instance_attributes><br>      </transient_attributes><br>      <lrm id="vm209"><br>        <lrm_resources><br>          <lrm_resource id="sbd-fencing:0" type="external/sbd" class="stonith"><br>

            <lrm_rsc_op id="sbd-fencing:0_monitor_0" operation="monitor" crm-debug-origin="build_active_RAs" crm_feature_set="3.0.1" transition-key="4:1:7:f0adcb5c-10d1-4525-b094-b5ab1f776ee0" transition-magic="0:7;4:1:7:f0adcb5c-10d1-4525-b094-b5ab1f776ee0" call-id="2" rc-code="7" op-status="0" interval="0" last-run="1273820137" last-rc-change="1273820137" exec-time="60" queue-time="0" op-digest="4c3fd39434577fbb6540606d808ed050"/><br>

            <lrm_rsc_op id="sbd-fencing:0_start_0" operation="start" crm-debug-origin="build_active_RAs" crm_feature_set="3.0.1" transition-key="5:1:0:f0adcb5c-10d1-4525-b094-b5ab1f776ee0" transition-magic="0:0;5:1:0:f0adcb5c-10d1-4525-b094-b5ab1f776ee0" call-id="3" rc-code="0" op-status="0" interval="0" last-run="1273820137" last-rc-change="1273820137" exec-time="10" queue-time="0" op-digest="4c3fd39434577fbb6540606d808ed050"/><br>

            <lrm_rsc_op id="sbd-fencing:0_monitor_20000" operation="monitor" crm-debug-origin="build_active_RAs" crm_feature_set="3.0.1" transition-key="6:2:0:f0adcb5c-10d1-4525-b094-b5ab1f776ee0" transition-magic="0:0;6:2:0:f0adcb5c-10d1-4525-b094-b5ab1f776ee0" call-id="4" rc-code="0" op-status="0" interval="20000" last-run="1273822956" last-rc-change="1273820137" exec-time="1170" queue-time="0" op-digest="4029bbaef749649e82d602afb46dd872"/><br>

          </lrm_resource><br>        </lrm_resources><br>      </lrm><br>    </node_state><br>    <node_state id="vm208" uname="vm208" ha="dead" in_ccm="false" crmd="offline" crm-debug-origin="send_stonith_update" join="down" expected="down" shutdown="0"/><br>

    <node_state id="vm210" uname="vm210" ha="active" in_ccm="true" crmd="online" crm-debug-origin="post_cache_update" join="member" expected="member" shutdown="0"><br>

      <transient_attributes id="vm210"><br>        <instance_attributes id="status-vm210"><br>          <nvpair id="status-vm210-probe_complete" name="probe_complete" value="true"/><br>

        </instance_attributes><br>      </transient_attributes><br>      <lrm id="vm210"><br>        <lrm_resources><br>          <lrm_resource id="sbd-fencing:2" type="external/sbd" class="stonith"><br>

            <lrm_rsc_op id="sbd-fencing:2_monitor_0" operation="monitor" crm-debug-origin="build_active_RAs" crm_feature_set="3.0.1" transition-key="8:5:7:f0adcb5c-10d1-4525-b094-b5ab1f776ee0" transition-magic="0:7;8:5:7:f0adcb5c-10d1-4525-b094-b5ab1f776ee0" call-id="2" rc-code="7" op-status="0" interval="0" last-run="1273820388" last-rc-change="1273820388" exec-time="20" queue-time="0" op-digest="4c3fd39434577fbb6540606d808ed050"/><br>

            <lrm_rsc_op id="sbd-fencing:2_start_0" operation="start" crm-debug-origin="build_active_RAs" crm_feature_set="3.0.1" transition-key="13:5:0:f0adcb5c-10d1-4525-b094-b5ab1f776ee0" transition-magic="0:0;13:5:0:f0adcb5c-10d1-4525-b094-b5ab1f776ee0" call-id="3" rc-code="0" op-status="0" interval="0" last-run="1273820388" last-rc-change="1273820388" exec-time="10" queue-time="0" op-digest="4c3fd39434577fbb6540606d808ed050"/><br>

            <lrm_rsc_op id="sbd-fencing:2_monitor_20000" operation="monitor" crm-debug-origin="build_active_RAs" crm_feature_set="3.0.1" transition-key="14:5:0:f0adcb5c-10d1-4525-b094-b5ab1f776ee0" transition-magic="0:0;14:5:0:f0adcb5c-10d1-4525-b094-b5ab1f776ee0" call-id="4" rc-code="0" op-status="0" interval="20000" last-run="1273822976" last-rc-change="1273820389" exec-time="1040" queue-time="0" op-digest="4029bbaef749649e82d602afb46dd872"/><br>

          </lrm_resource><br>        </lrm_resources><br>      </lrm><br>    </node_state><br>  </status><br></cib><br><br><br><br><br>
</blockquote></div><br><br clear="all"><br>-- <br>Javen Wu<br>