#!/bin/bash
# Print a human-readable description of this test: what it verifies,
# the prerequisites for running it and the expected results.
# Arguments: none
# Outputs:   the description text on stdout
test_info()
{
    # Quoted delimiter: the text is emitted literally, with no expansion.
    cat <<'EOF'
Verify that NFS connections are monitored and that NFS tickles are sent.

We create a connection to the NFS server on a node and confirm that
this connection is registered in the nfs-tickles/ subdirectory in
shared storage.  Then kill ctdbd on the relevant NFS server node and
ensure that the takeover node sends an appropriate reset packet.

Prerequisites:

* An active CTDB cluster with at least 2 nodes with public addresses.

* Test must be run on a real or virtual cluster rather than against
  local daemons.

* Test must not be run from a cluster node.

* Cluster nodes must be listening on the NFS TCP port (2049).

Expected results:

* CTDB should correctly record the socket and on failover the takeover
  node should send a reset packet.
EOF
}
# Pull in the integration test helpers used throughout this script.
. "${TEST_SCRIPTS_DIR}/integration.bash"

set -e

ctdb_test_init

ctdb_test_check_real_cluster

cluster_is_healthy

# We need this for later, so we know how long to run nc for.
# The helper's result is read from $out; the value is whatever follows
# "= " in that output.
# NOTE: $CTDB is deliberately left unquoted, as in the original
# invocation - presumably it may expand to more than one word.
try_command_on_node any $CTDB getvar MonitorInterval
monitor_interval="${out#*= }"
#echo "Monitor interval on node $test_node is $monitor_interval seconds."

select_test_node_and_ips
try_command_on_node "$test_node" "$CTDB listnodes | wc -l"
numnodes="$out"

test_port=2049

echo "Connecting to node ${test_node} on IP ${test_ip}:${test_port} with netcat..."

# The sleep feeding the pipe keeps nc's stdin open for 4 monitor
# intervals.  $! is the PID of the last command in the background
# pipeline, i.e. nc.
sleep $((monitor_interval * 4)) | nc "$test_ip" "$test_port" &
nc_pid=$!
# Make sure the background nc is cleaned up when the test exits.
ctdb_test_exit_hook_add "kill $nc_pid >/dev/null 2>&1"

wait_until_get_src_socket "tcp" "${test_ip}:${test_port}" "$nc_pid" "nc"
src_socket="$out"
echo "Source socket is $src_socket"

wait_for_monitor_event "$test_node"

echo "Wait until NFS connection is tracked by CTDB on test node ..."
wait_until 10 check_tickles "$test_node" "$test_ip" "$test_port" "$src_socket"

echo "Getting TickleUpdateInterval..."
try_command_on_node "$test_node" $CTDB getvar TickleUpdateInterval
# Parse the value the same way as MonitorInterval above, rather than
# relying on arithmetic expansion to evaluate the raw "Name = N" text.
update_interval="${out#*= }"

echo "Wait until NFS connection is tracked by CTDB on all nodes..."
wait_until $((update_interval * 2)) \
    check_tickles_all "$numnodes" "$test_ip" "$test_port" "$src_socket"

tcptickle_sniff_start "$src_socket" "${test_ip}:${test_port}"

# We need to be nasty to make sure that the node being failed out
# doesn't get a chance to send any tickles and confuse our sniff.  IPs
# also need to be dropped because we're simulating a dead node rather
# than a CTDB failure.  To properly handle a CTDB failure we would need
# a watchdog to drop the IPs when CTDB disappears.
echo "Killing ctdbd on ${test_node}..."
try_command_on_node -v "$test_node" "killall -9 ctdbd ; $CTDB_TEST_WRAPPER drop_ips ${test_node_ips}"

wait_until_node_has_status "$test_node" disconnected

tcptickle_sniff_wait_show