#!/bin/sh
#################################
# interface event script for ctdb
# this adds/removes IPs from your
# public interface
#
# Requires $CTDB_BASE to point at the directory holding the shared
# "functions" file; the helpers used below (loadconfig, get_proc,
# set_proc, add_ip_to_iface, ...) are expected to come from there.

. "$CTDB_BASE/functions"
loadconfig

# Fall back to the public_addresses file under $CTDB_BASE when no
# explicit location has been configured.
if [ -z "$CTDB_PUBLIC_ADDRESSES" ] ; then
    CTDB_PUBLIC_ADDRESSES=$CTDB_BASE/public_addresses
fi

# Without a public addresses file there is nothing for this script to
# manage, so every event succeeds trivially.
if [ ! -f "$CTDB_PUBLIC_ADDRESSES" ] ; then
    exit 0
fi

# Record that an interface has link.
# Globals:   up_interfaces_found (set to "true")
# Arguments: $1 - interface name
# Returns:   exit status of "ctdb setifacelink"
mark_up ()
{
    up_interfaces_found=true
    ctdb setifacelink "$1" up >/dev/null 2>&1
}
# Record that an interface has no usable link.
# Globals:   fail (set to "true")
# Arguments: $1 - interface name
# Returns:   exit status of "ctdb setifacelink"
mark_down ()
{
    fail=true
    ctdb setifacelink "$1" down >/dev/null 2>&1
}

# Build the list of interfaces that may carry public addresses.
# This sets $all_interfaces as a side-effect (one name per line, sorted,
# duplicates removed).  $ctdb_ifaces is also left set.
# Globals:   CTDB_PUBLIC_ADDRESSES, CTDB_PUBLIC_INTERFACE,
#            CTDB_NATGW_PUBLIC_IFACE (read)
#            all_interfaces, ctdb_ifaces (written)
get_all_interfaces ()
{
    # Get all the interfaces listed in the public_addresses file: drop
    # the first (address) field, turn commas into spaces and trim
    # trailing blanks.  [[:blank:]] is used rather than "\t" because a
    # backslash escape inside a bracket expression is not portable.
    all_interfaces=$(sed -e 's/^[^[:blank:]]*[[:blank:]]*//' \
                         -e 's/,/ /g' \
                         -e 's/[[:blank:]]*$//' \
                         "$CTDB_PUBLIC_ADDRESSES")

    # Add some special interfaces if they're defined
    if [ -n "$CTDB_PUBLIC_INTERFACE" ] ; then
        all_interfaces="$CTDB_PUBLIC_INTERFACE $all_interfaces"
    fi
    if [ -n "$CTDB_NATGW_PUBLIC_IFACE" ] ; then
        all_interfaces="$CTDB_NATGW_PUBLIC_IFACE $all_interfaces"
    fi

    # For all but the 1st line, get the 2nd last field with commas
    # changed to spaces.
    ctdb_ifaces=$(ctdb -Y ip -v |
                  sed -e '1d' -e 's/:[^:]*:$//' -e 's/^.*://' -e 's/,/ /g')

    # Add $ctdb_ifaces and uniquify.  The expansions are deliberately
    # unquoted so that newlines collapse into single spaces first.
    all_interfaces=$(echo $all_interfaces $ctdb_ifaces | tr ' ' '\n' | sort -u)
}

# Check link state of every interface returned by get_all_interfaces and
# report it to ctdb via mark_up / mark_down.
# Globals:   all_interfaces (read, set by get_all_interfaces)
#            fail, up_interfaces_found (reset here, updated by
#            mark_down / mark_up)
#            CTDB_PARTIALLY_ONLINE_INTERFACES (read)
#            iface, realiface, bi (written as scratch variables)
# Outputs:   diagnostic messages on stdout
# Returns:   0 if no interface was marked down, or if at least one
#            interface is up and CTDB_PARTIALLY_ONLINE_INTERFACES is
#            "yes"; 1 otherwise
monitor_interfaces()
{
    get_all_interfaces

    fail=false
    up_interfaces_found=false

    for iface in $all_interfaces ; do
        # A missing interface is reported but does not count as a failure.
        if ! ip addr show "$iface" >/dev/null 2>&1 ; then
            echo "Interface $iface does not exist but it is used by public addresses."
            continue
        fi

        # These interfaces are sometimes bond devices
        # When we use VLANs for bond interfaces, there will only
        # be an entry in /proc for the underlying real interface
        realiface=${iface%%.*}

        if bi=$(get_proc "net/bonding/$realiface" 2>/dev/null) ; then
            if echo "$bi" | grep -q 'Currently Active Slave: None' ; then
                echo "ERROR: No active slaves for bond device $realiface"
                mark_down "$iface"
                continue
            fi

            if ! echo "$bi" | grep -q '^MII Status: up' ; then
                echo "ERROR: public network interface $realiface is down"
                mark_down "$iface"
                continue
            fi

            if echo "$bi" | grep -q '^Bonding Mode: IEEE 802.3ad Dynamic link aggregation' ; then
                # This works around a bug in the driver where the
                # overall bond status can be up but none of the actual
                # physical interfaces have a link.  The first
                # "MII Status:" line is skipped so that only the
                # remaining ones are inspected.
                if ! echo "$bi" | grep 'MII Status:' | tail -n +2 | grep -q '^MII Status: up' ; then
                    echo "No active slaves for 802.ad bond device $realiface"
                    mark_down "$iface"
                    continue
                fi
            fi

            mark_up "$iface"
            continue
        fi

        case $iface in
            lo*)
                # loopback is always working
                mark_up "$iface"
                ;;
            ib*)
                # we dont know how to test ib links
                mark_up "$iface"
                ;;
            *)
                # Interfaces driven by virtio_net are treated as up without
                # asking ethtool; everything else must report link.
                if [ "$(basename "$(readlink "/sys/class/net/$iface/device/driver")" 2>/dev/null)" != virtio_net ] &&
                   ! ethtool "$iface" | grep -q 'Link detected: yes' ; then
                    # On some systems, this is not successful when a
                    # cable is plugged but the interface has not been
                    # brought up previously. Bring the interface up and
                    # try again...
                    ip link set "$iface" up
                    if ! ethtool "$iface" | grep -q 'Link detected: yes' ; then
                        echo "ERROR: No link on the public network interface $iface"
                        mark_down "$iface"
                        continue
                    fi
                fi
                mark_up "$iface"
                ;;
        esac
    done

    # Nothing was marked down: healthy.
    if ! $fail ; then
        return 0
    fi

    # Some interface is down, but partial availability is acceptable
    # when explicitly configured and at least one interface is up.
    if $up_interfaces_found && [ "$CTDB_PARTIALLY_ONLINE_INTERFACES" = "yes" ] ; then
        return 0
    fi

    return 1
}

# Dispatch on the event name passed by ctdbd as $1.  Any event that
# does not exit explicitly falls through to "exit 0" below.
case "$1" in
    #############################
    # called when ctdbd starts up
    init)
        # make sure that we only respond to ARP messages from the NIC where
        # a particular ip address is associated.
        if get_proc sys/net/ipv4/conf/all/arp_filter >/dev/null 2>&1 ; then
            set_proc sys/net/ipv4/conf/all/arp_filter 1
        fi
        ;;

    #############################
    # called after ctdbd has done its initial recovery
    # and we start the services to become healthy
    startup)
        # Set the ctdb link state of every interface listed in
        # $INTERFACES to down, then run one monitoring pass.  The result
        # of that pass is not used as the exit status.
        # NOTE(review): nothing in this script assigns $INTERFACES, so
        # unless the sourced configuration provides it this loop does
        # nothing - confirm whether $all_interfaces was intended.
        INTERFACES=$(for IFACE in $INTERFACES ; do echo $IFACE ; done | sort | uniq)
        for IFACE in $INTERFACES ; do
            ctdb setifacelink "$IFACE" down >/dev/null 2>/dev/null
        done

        monitor_interfaces
        ;;

    ################################################
    # called when ctdbd wants to claim an IP address
    takeip)
        if [ $# != 4 ]; then
            echo "must supply interface, IP and maskbits"
            exit 1
        fi
        iface=$2
        ip=$3
        maskbits=$4

        add_ip_to_iface "$iface" "$ip" "$maskbits" || exit 1

        # cope with the script being killed while we have the interface blocked
        iptables -D INPUT -i "$iface" -d "$ip" -j DROP 2> /dev/null

        # flush our route cache
        set_proc sys/net/ipv4/route/flush 1
        ;;

    ##################################################
    # called when ctdbd wants to release an IP address
    releaseip)
        if [ $# != 4 ]; then
            echo "must supply interface, IP and maskbits"
            exit 1
        fi

        # releasing an IP is a bit more complex than it seems. Once the IP
        # is released, any open tcp connections to that IP on this host will end
        # up being stuck. Some of them (such as NFS connections) will be unkillable
        # so we need to use the killtcp ctdb function to kill them off. We also
        # need to make sure that no new connections get established while we are
        # doing this! So what we do is this:
        # 1) firewall this IP, so no new external packets arrive for it
        # 2) use netstat -tn to find existing connections, and kill them
        # 3) remove the IP from the interface
        # 4) remove the firewall rule
        iface=$2
        ip=$3
        maskbits=$4

        # we do an extra delete to cope with the script being killed
        iptables -D INPUT -i "$iface" -d "$ip" -j DROP 2> /dev/null
        iptables -I INPUT -i "$iface" -d "$ip" -j DROP
        kill_tcp_connections "$ip"

        if ! delete_ip_from_iface "$iface" "$ip" "$maskbits" ; then
            # Do not leave the address firewalled when giving up.
            iptables -D INPUT -i "$iface" -d "$ip" -j DROP 2> /dev/null
            exit 1
        fi

        iptables -D INPUT -i "$iface" -d "$ip" -j DROP 2> /dev/null

        # flush our route cache
        set_proc sys/net/ipv4/route/flush 1
        ;;

    ##################################################
    # called when ctdbd wants to update an IP address
    updateip)
        if [ $# != 5 ]; then
            echo "must supply old interface, new interface, IP and maskbits"
            exit 1
        fi

        # moving an IP is a bit more complex than it seems.
        # First we drop all traffic on the old interface, then the
        # address is moved and the firewall rule is lifted again.
        #
        # 1) firewall this IP, so no new external packets arrive for it
        # 2) remove the IP from the old and the new interface
        #    (failures are ignored and their messages discarded)
        # 3) add the IP to the new interface
        # 4) remove the firewall rule
        # 5) flush the route cache
        # 6) use ctdb gratiousarp to propagate the new mac address
        # 7) tickle existing connections
        oiface=$2
        niface=$3
        ip=$4
        maskbits=$5

        # we do an extra delete to cope with the script being killed
        iptables -D INPUT -i "$oiface" -d "$ip" -j DROP 2> /dev/null
        iptables -I INPUT -i "$oiface" -d "$ip" -j DROP

        delete_ip_from_iface "$oiface" "$ip" "$maskbits" 2>/dev/null
        delete_ip_from_iface "$niface" "$ip" "$maskbits" 2>/dev/null

        if ! add_ip_to_iface "$niface" "$ip" "$maskbits" ; then
            # Do not leave the address firewalled when giving up.
            iptables -D INPUT -i "$oiface" -d "$ip" -j DROP 2> /dev/null
            exit 1
        fi

        # cope with the script being killed while we have the interface blocked
        iptables -D INPUT -i "$oiface" -d "$ip" -j DROP 2> /dev/null

        # flush our route cache
        set_proc sys/net/ipv4/route/flush 1

        # propagate the new mac address
        ctdb gratiousarp "$ip" "$niface"

        # tickle all existing connections, so that dropped packets
        # are retransmitted and the tcp streams work
        tickle_tcp_connections "$ip"
        ;;

    ###########################################
    # called when ctdbd has finished a recovery
    recovered)
        ;;

    ####################################
    # called when ctdbd is shutting down
    shutdown)
        ;;

    # periodic health check: fail the event if the interfaces are unhealthy
    monitor)
        monitor_interfaces || exit 1
        ;;

    # everything else is passed to the shared handler
    *)
        ctdb_standard_event_handler "$@"
        ;;
esac

exit 0