[Pacemaker] Master/Slave resource cannot start

Diego Remolina diego.remolina at physics.gatech.edu
Tue Aug 11 12:21:26 EDT 2009


> Solution:
> 1) clone the pingd
> 2) Delete your colocation constraint. It is useless.
> 3) Make a location constraint that allows the IP address to run only on a
> node that gets points from pingd.

I want to thank Michael for pointing out my mistake. I have also 
migrated away from using heartbeat to openais.

I have noticed that, more often than not, after a node is rebooted 
openais starts but crm fails to start correctly. I usually have to kill 
openais with "pkill -9 aisexec" and then start it again, after which it 
usually works fine.

In any case, here is my final configuration which works for 2 drbd 
resources to run a file server with nfs and samba.

[root@phys-file01 ~]# crm configure show
node phys-file01.physics.gatech.edu
node phys-file02.physics.gatech.edu
primitive drbd_export ocf:linbit:drbd \
         params drbd_resource="export" \
         op monitor interval="59s" role="Master" timeout="30s" \
         op monitor interval="60s" role="Slave" timeout="30s"
primitive drbd_scratch ocf:linbit:drbd \
         params drbd_resource="scratch" \
         op monitor interval="59s" role="Master" timeout="30s" \
         op monitor interval="60s" role="Slave" timeout="30s"
primitive fs_export ocf:heartbeat:Filesystem \
         params type="ext4dev" device="/dev/drbd0" directory="/export/data" options="rw,user_xattr,acl,usrquota,grpquota"
primitive fs_scratch ocf:heartbeat:Filesystem \
         params type="ext4dev" device="/dev/drbd1" directory="/export/scratch" options="rw,user_xattr,acl,usrquota,grpquota"
primitive nfs lsb:nfs \
         op monitor interval="30s"
primitive pingd ocf:pacemaker:pingd \
         params host_list="130.207.139.1" multiplier="100" \
         op monitor interval="10s" timeout="5"
primitive samba lsb:smb \
         op monitor interval="30s"
primitive virtual-ip-1 ocf:heartbeat:IPaddr2 \
         params ip="130.207.139.20" cidr_netmask="24"
group fileserver fs_export fs_scratch virtual-ip-1 nfs samba
ms ms-drbd_export drbd_export \
         meta clone_max="2" clone_node_max="1" master_max="1" master_node_max="1" notify="true"
ms ms-drbd_scratch drbd_scratch \
         meta clone_max="2" clone_node_max="1" master_max="1" master_node_max="1" notify="true"
clone pingd-clone pingd \
         params pingd-dampen="5s" pingd-multiplier="100" ping-hosts="130.207.139.1"
location drbd-fence-by-handler-ms-drbd_export ms-drbd_export \
         rule $id="drbd-fence-by-handler-rule-ms-drbd_export" $role="Master" -inf: #uname ne phys-file01.physics.gatech.edu
location drbd-fence-by-handler-ms-drbd_scratch ms-drbd_scratch \
         rule $id="drbd-fence-by-handler-rule-ms-drbd_scratch" $role="Master" -inf: #uname ne phys-file01.physics.gatech.edu
location ms-drbd_export-on-connected-node ms-drbd_export \
         rule $id="ms-drbd_export-on-connected-node-rule" $role="Master" -inf: not_defined pingd or pingd lte 0
colocation fileserver-on-ms-drbd_export inf: fileserver ms-drbd_export:Master
colocation ms-drbd_scratch-on-ms-drbd_export inf: ms-drbd_scratch:Master ms-drbd_export:Master
order ms-drbd_export-before-fileserver inf: ms-drbd_export:promote fileserver:start
order ms-drbd_scratch-before-fileserver inf: ms-drbd_scratch:promote fileserver:start
property $id="cib-bootstrap-options" \
         dc-version="1.0.4-6dede86d6105786af3a5321ccf66b44b6914f0aa" \
         cluster-infrastructure="openais" \
         expected-quorum-votes="2" \
         no-quorum-policy="ignore" \
         last-lrm-refresh="1250006912"
property $id="cib-bootstrap-options-stonith-enabled" \
         stonith-enabled="false"


Diego



More information about the Pacemaker mailing list