[Linux-HA] Resources fail to start during single node startup/reboot

Lasantha Marian Mon, 15 Jun 2009 07:55:37 -0700

Hi,

I have a two node cluster setup using Heartbeat 2.99.3/Pacemaker 1.0.2
on an Ubuntu 8.10 server built on two identical Dell 2900 servers.
Basically, Heartbeat works as expected. My configuration uses the CRM to
manage resources and DRBD for storage.


I have noticed the following.

If node A is running while node B has failed, and node A is then
rebooted (whilst node B still remains failed), none of the resources on
node A start. Is this the expected behavior? I was expecting node A to
bring all resources up even when node B is temporarily unavailable.
Can this be achieved?

If both nodes (A and B) are started again, all resources come up correctly.

The log mostly shows "WARN: native_color: Resource dr0:1 cannot
run anywhere" and similar messages.

Any help/explanation is appreciated.

Best regards,

Lasantha.

primitive dr0 ocf:heartbeat:drbd \
        params drbd_resource="www" \
        op monitor interval="59s" role="Master" timeout="30s" \
        op monitor interval="60s" role="Slave" timeout="30s"
primitive dr1 ocf:heartbeat:drbd \
        params drbd_resource="spool" \
        op monitor interval="59s" role="Master" timeout="30s" \
        op monitor interval="60s" role="Slave" timeout="30s"
primitive dr3 ocf:heartbeat:drbd \
        params drbd_resource="data" \
        op monitor interval="59s" role="Master" timeout="30s" \
        op monitor interval="60s" role="Slave" timeout="30s"
primitive fs0 ocf:heartbeat:Filesystem \
        params fstype="ext3" directory="/ha/www" device="/dev/drbd0" 
options="rw,relatime"
primitive fs1 ocf:heartbeat:Filesystem \
        params fstype="ext3" directory="/ha/spool" device="/dev/drbd1" 
options="rw,relatime"
primitive fs3 ocf:heartbeat:Filesystem \
        params fstype="ext3" directory="/ha/data" device="/dev/drbd3" 
options="rw,relatime"
primitive ip0 ocf:heartbeat:IPaddr2 \
        params ip="192.168.0.180" broadcast="192.168.0.255" nic="bond0" 
iflabel="0" cidr_netmask="24" \
        op monitor interval="21s" timeout="5s"
primitive pg0 ocf:heartbeat:pgsql \
        params pgctl="/usr/local/PostgreSQL/bin/pg_ctl" 
psql="/usr/local/PostgreSQL/bin/psql" pgdata="/ha/data/PostgreSQL" 
pgdba="postgresql" pgport="5432" pgdb="template1" \
        op monitor interval="10s" timeout="10s"
group rg0 fs0 fs1 fs3 ip0 pg0
ms ms0 dr0 \
        meta clone-max="2" notify="true" globally-unique="false" 
target-role="Started"
ms ms1 dr1 \
        meta clone-max="2" notify="true" globally-unique="false" 
target-role="Started"
ms ms3 dr3 \
        meta clone-max="2" notify="true" globally-unique="false" 
target-role="Started"
location ms0-master-on-connected-node ms0 \
        rule $id="ms0-master-on-connected-node-rule" $role="master" -inf: 
not_defined pingd or pingd lte 0
location ms1-master-on-connected-node ms1 \
        rule $id="ms1-master-on-connected-node-rule" $role="master" -inf: 
not_defined pingd or pingd lte 0
location ms3-master-on-connected-node ms3 \
        rule $id="ms3-master-on-connected-node-rule" $role="master" -inf: 
not_defined pingd or pingd lte 0
colocation rg0-on-ms0 inf: rg0 ms0:Master
colocation rg0-on-ms1 inf: rg0 ms1:Master
colocation rg0-on-ms3 inf: rg0 ms3:Master
order ms0-before-rg0 inf: ms0:promote rg0:start
order ms1-before-rg0 inf: ms1:promote rg0:start
order ms3-before-rg0 inf: ms3:promote rg0:start
property $id="cib-bootstrap-options" \
        dc-version="1.0.2-c02b459053bfa44d509a2a0e0247b291d93662b7" \
        no-quorum-policy="ignore"

_______________________________________________
Linux-HA mailing list
[email protected]
http://lists.linux-ha.org/mailman/listinfo/linux-ha
See also: http://linux-ha.org/ReportingProblems

[Linux-HA] Resources fail to start during single node startup/reboot

Reply via email to