mirror of
https://github.com/samba-team/samba.git
synced 2025-01-11 05:18:09 +03:00
38138b42f7
The main change is to source cluster.bash instead of integration.bash. While touching the preamble, the following additional changes are also made: * Drop test_info() definition and replace it with a comment The use of test_info() is pointless. * Drop call to ctdb_test_check_real_cluster() cluster.bash now does this. * Drop call to cluster_is_healthy() This is a holdover from when the previous test would restart daemons to get things ready for a test. There was also a bug where going into recovery during the restart would sometimes cause the cluster to become unhealthy. If we really need something like this then we can add it to ctdb_test_init(). Signed-off-by: Martin Schwenke <martin@meltin.net> Reviewed-by: Amitay Isaacs <amitay@gmail.com>
79 lines
2.5 KiB
Bash
Executable File
79 lines
2.5 KiB
Bash
Executable File
#!/bin/bash
|
|
|
|
# Verify that NFS connections are monitored and that NFS tickles are sent.
|
|
|
|
# We create a connection to the NFS server on a node and confirm that
|
|
# this connection is registered in the nfs-tickles/ subdirectory in
|
|
# shared storage. Then kill ctdbd on the relevant NFS server node and
|
|
# ensure that the takeover node sends an appropriate reset packet.
|
|
|
|
# Prerequisites:
|
|
|
|
# * An active CTDB cluster with at least 2 nodes with public addresses.
|
|
|
|
# * Test must be run on a real or virtual cluster rather than against
|
|
# local daemons.
|
|
|
|
# * Test must not be run from a cluster node.
|
|
|
|
# * Cluster nodes must be listening on the NFS TCP port (2049).
|
|
|
|
# Expected results:
|
|
|
|
# * CTDB should correctly record the socket and on failover the takeover
|
|
# node should send a reset packet.
|
|
|
|
. "${TEST_SCRIPTS_DIR}/cluster.bash"
|
|
|
|
set -e
|
|
|
|
ctdb_test_init
|
|
|
|
# We need this for later, so we know how long to run nc for.
|
|
try_command_on_node any $CTDB getvar MonitorInterval
|
|
monitor_interval="${out#*= }"
|
|
#echo "Monitor interval on node $test_node is $monitor_interval seconds."
|
|
|
|
select_test_node_and_ips
|
|
try_command_on_node $test_node "$CTDB listnodes | wc -l"
|
|
numnodes="$out"
|
|
|
|
test_port=2049
|
|
|
|
echo "Connecting to node ${test_node} on IP ${test_ip}:${test_port} with netcat..."
|
|
|
|
sleep $((monitor_interval * 4)) | nc $test_ip $test_port &
|
|
nc_pid=$!
|
|
ctdb_test_exit_hook_add "kill $nc_pid >/dev/null 2>&1"
|
|
|
|
wait_until_get_src_socket "tcp" "${test_ip}:${test_port}" $nc_pid "nc"
|
|
src_socket="$out"
|
|
echo "Source socket is $src_socket"
|
|
|
|
wait_for_monitor_event $test_node
|
|
|
|
echo "Wait until NFS connection is tracked by CTDB on test node ..."
|
|
wait_until 10 check_tickles $test_node $test_ip $test_port $src_socket
|
|
|
|
echo "Getting TicklesUpdateInterval..."
|
|
try_command_on_node $test_node $CTDB getvar TickleUpdateInterval
|
|
update_interval="$out"
|
|
|
|
echo "Wait until NFS connection is tracked by CTDB on all nodes..."
|
|
wait_until $(($update_interval * 2)) \
|
|
check_tickles_all $numnodes $test_ip $test_port $src_socket
|
|
|
|
tcptickle_sniff_start $src_socket "${test_ip}:${test_port}"
|
|
|
|
# We need to be nasty to make that the node being failed out doesn't
|
|
# get a chance to send any tickles and confuse our sniff. IPs also
|
|
# need to be dropped because we're simulating a dead node rather than
|
|
# a CTDB failure. To properly handle a CTDB failure we would need a
|
|
# watchdog to drop the IPs when CTDB disappears.
|
|
echo "Killing ctdbd on ${test_node}..."
|
|
try_command_on_node -v $test_node "killall -9 ctdbd ; $CTDB_TEST_WRAPPER drop_ips ${test_node_ips}"
|
|
|
|
wait_until_node_has_status $test_node disconnected
|
|
|
|
tcptickle_sniff_wait_show
|