Hi,
today one DomU running mainly Apache, Typo3, and MySQL became unusable.
Last message from Nagios:
Ram : 98%, Swap : 100% : 99, 90 : CRITICAL
After logging in with xm console, I saw oom-killer messages and did an xm
destroy.
Is there any solution to automatically destroy and restart a DomU in
such a case?
The current crm config is as follows (only the relevant part of one
DomU):
xen11:/# crm configure show
node $id="xxx" xen11
node $id="yyy" xen10
primitive xen_drbd2_1 ocf:linbit:drbd \
params drbd_resource="drbd2_1" \
op monitor interval="15s" \
op start interval="0" timeout="240s" \
op stop interval="0" timeout="100s"
primitive xen_drbd2_2 ocf:linbit:drbd \
params drbd_resource="drbd2_2" \
op monitor interval="15s" \
op start interval="0" timeout="240s" \
op stop interval="0" timeout="100s"
primitive xen_typo3 ocf:heartbeat:Xen \
params xmfile="/etc/xen/typo3.cfg" \
op monitor interval="3s" timeout="30s" \
op start interval="0" timeout="60s" \
op stop interval="0" timeout="40s" \
meta target-role="Started" allow-migrate="false" is-managed="true"
group group_drbd2 xen_drbd2_1 xen_drbd2_2
ms DrbdClone2 group_drbd2 \
meta master_max="1" master-mode-max="1" clone-max="2" clone-node-max="1" notify="true"
location cli-prefer-xen_typo3 xen_typo3 \
rule $id="cli-prefer-rule-xen_typo3" inf: #uname eq xen10
colocation xen_typo3_and_drbd inf: xen_typo3 DrbdClone2:Master
order xen_typo3_after_drbd inf: DrbdClone2:promote xen_typo3:start
property $id="cib-bootstrap-options" \
dc-version="1.0.9-74392a28b7f31d7ddc86689598bd23114f58978b" \
cluster-infrastructure="Heartbeat" \
stonith-enabled="false" \
no-quorum-policy="ignore" \
last-lrm-refresh="1331211005" \
maintenance-mode="false"
rsc_defaults $id="rsc-options" \
resource-stickiness="100"
TIA
Helmut Wollmersdorfer
_______________________________________________
Linux-HA mailing list
[email protected]
http://lists.linux-ha.org/mailman/listinfo/linux-ha
See also: http://linux-ha.org/ReportingProblems