1
0
mirror of https://github.com/samba-team/samba.git synced 2025-01-25 06:04:04 +03:00
samba-mirror/ctdb/config/ctdbd_wrapper
Martin Schwenke 4b652c1527 ctdb-scripts: Don't bother checking PID file when starting ctdbd
This is an optimisation that can cause incorrect results.  If ctdbd
was killed and there is a stale PID file then this will often cause
"CTDB exited during initialisation".  The wrapper reads the old PID
from the PID file, finds the PID gone, complains and exits.

It is better to drop this code and finally get this right.  If ctdbd
does exit early then it will take CTDB_STARTUP_TIMEOUT (default 10)
seconds before the wrapper fails.  That's not too bad...

Signed-off-by: Martin Schwenke <martin@meltin.net>
Reviewed-by: Amitay Isaacs <amitay@gmail.com>
2017-11-07 03:53:27 +01:00

300 lines
7.7 KiB
Bash
Executable File

#!/bin/sh
# ctdbd wrapper - start or stop CTDB
usage ()
{
echo "usage: ctdbd_wrapper <pidfile> { start | stop }"
exit 1
}
[ $# -eq 2 ] || usage
pidfile="$1"
action="$2"
############################################################
if [ -z "$CTDB_BASE" ] ; then
export CTDB_BASE="/usr/local/etc/ctdb"
fi
. "${CTDB_BASE}/functions"
loadconfig "ctdb"
[ -n "$CTDB_SOCKET" ] && export CTDB_SOCKET
ctdbd="${CTDBD:-/usr/local/sbin/ctdbd}"
############################################################
# ctdbd_is_running()
# Check if ctdbd is running. ctdbd is only considered to running if
# the PID in the PID file is active and is called "ctdbd". Return
# true if this is the case. Print the PID regardless, since it can be
# used to kill stale processes in the session.
ctdbd_is_running ()
{
if read _pid 2>/dev/null <"$pidfile" ; then
echo "$_pid"
# This could be optimised with ps options -q and -h.
# However, -q is not generally available because it is
# fairly new and -h is not in some older distros. The
# options below are portable.
_cmd=$(ps -p "$_pid" -o comm | tail -n +2)
[ "$_cmd" = "ctdbd" ]
else
# Missing/empty PID file
return 1
fi
}
############################################################
# If necessary, mount volatile database directory on tmpfs
dbdir_tmpfs_start ()
{
if [ -z "$CTDB_DBDIR_TMPFS_OPTIONS" ] ; then
return
fi
# Shortcut for readability
_opts="$CTDB_DBDIR_TMPFS_OPTIONS"
mkdir -p "$CTDB_DBDIR" || exit $?
# If already mounted then remount, otherwise mount
if findmnt -t tmpfs "$CTDB_DBDIR" >/dev/null ; then
mount -t tmpfs -o "remount,$_opts" none "$CTDB_DBDIR" || \
exit $?
else
mount -t tmpfs -o "$_opts" none "$CTDB_DBDIR" || exit $?
fi
}
# If necessary, unmount volatile database tmpfs directory on exit
dbdir_tmpfs_stop ()
{
if [ -z "$CTDB_DBDIR_TMPFS_OPTIONS" ] ; then
return
fi
if [ -d "$CTDB_DBDIR" ] && findmnt -t tmpfs "$CTDB_DBDIR" >/dev/null ; then
umount "$CTDB_DBDIR"
fi
}
# Only the nested function references its arguments
# shellcheck disable=SC2120
build_ctdb_options ()
{
ctdb_options=""
maybe_set ()
{
# If the given variable isn't set then do nothing
[ -n "$2" ] || return
# If a required value for the variable and it doesn't match,
# then do nothing
[ -z "$3" -o "$3" = "$2" ] || return
val="'$2'"
case "$1" in
--*) sep="=" ;;
-*) sep=" " ;;
esac
# For these options we're only passing a value-less flag.
if [ -n "$3" ] ; then
val=""
sep=""
fi
ctdb_options="${ctdb_options}${ctdb_options:+ }${1}${sep}${val}"
}
if [ -z "$CTDB_RECOVERY_LOCK" ] ; then
echo "No recovery lock specified. Starting CTDB without split brain prevention."
fi
maybe_set "--reclock" "$CTDB_RECOVERY_LOCK"
maybe_set "--pidfile" "$pidfile"
# build up ctdb_options variable from optional parameters
maybe_set "--logging" "$CTDB_LOGGING"
maybe_set "--nlist" "$CTDB_NODES"
maybe_set "--socket" "$CTDB_SOCKET"
maybe_set "--listen" "$CTDB_NODE_ADDRESS"
maybe_set "--public-addresses" "$CTDB_PUBLIC_ADDRESSES"
maybe_set "--public-interface" "$CTDB_PUBLIC_INTERFACE"
maybe_set "--dbdir" "$CTDB_DBDIR"
maybe_set "--dbdir-persistent" "$CTDB_DBDIR_PERSISTENT"
maybe_set "--dbdir-state" "$CTDB_DBDIR_STATE"
maybe_set "--event-script-dir" "$CTDB_EVENT_SCRIPT_DIR"
maybe_set "--transport" "$CTDB_TRANSPORT"
maybe_set "-d" "$CTDB_DEBUGLEVEL"
maybe_set "--notification-script" "$CTDB_NOTIFY_SCRIPT"
maybe_set "--start-as-disabled" "$CTDB_START_AS_DISABLED" "yes"
maybe_set "--start-as-stopped " "$CTDB_START_AS_STOPPED" "yes"
maybe_set "--no-recmaster" "$CTDB_CAPABILITY_RECMASTER" "no"
maybe_set "--no-lmaster" "$CTDB_CAPABILITY_LMASTER" "no"
maybe_set "--nosetsched" "$CTDB_NOSETSCHED" "yes"
maybe_set "--script-log-level" "$CTDB_SCRIPT_LOG_LEVEL"
maybe_set "--max-persistent-check-errors" "$CTDB_MAX_PERSISTENT_CHECK_ERRORS"
}
export_debug_variables ()
{
[ -n "$CTDB_DEBUG_HUNG_SCRIPT" ] && export CTDB_DEBUG_HUNG_SCRIPT
[ -n "$CTDB_EXTERNAL_TRACE" ] && export CTDB_EXTERNAL_TRACE
[ -n "$CTDB_DEBUG_LOCKS" ] && export CTDB_DEBUG_LOCKS
}
kill_ctdbd ()
{
_session="$1"
if [ -n "$_session" ] ; then
pkill -9 -s "$_session" 2>/dev/null
fi
}
############################################################
start()
{
if _session=$(ctdbd_is_running) ; then
echo "CTDB is already running"
return 0
fi
# About to start new $ctdbd. The main daemon is not running but
# there may still be other processes around, so do some cleanup.
kill_ctdbd "$_session"
dbdir_tmpfs_start
# build_ctdb_options() takes no arguments
# shellcheck disable=SC2119
build_ctdb_options
export_debug_variables
# Explicitly trying to disable core files, no other way
# shellcheck disable=SC2039
if [ "$CTDB_SUPPRESS_COREFILE" = "yes" ]; then
ulimit -c 0
else
ulimit -c unlimited
fi
# Unsupported option easily avoided by not using configuration variable
# shellcheck disable=SC2039
if [ -n "$CTDB_MAX_OPEN_FILES" ]; then
ulimit -n "$CTDB_MAX_OPEN_FILES"
fi
_d=$(dirname "$pidfile")
mkdir -p "$_d"
if [ -n "$CTDB_VALGRIND" -a "$CTDB_VALGRIND" != "no" ] ; then
if [ "$CTDB_VALGRIND" = "yes" ] ; then
ctdbd="valgrind -q --log-file=/usr/local/var/log/ctdb_valgrind ${ctdbd}"
else
ctdbd="${CTDB_VALGRIND} ${ctdbd}"
fi
ctdb_options="${ctdb_options} --valgrinding"
fi
case "$CTDB_LOGGING" in
syslog:udp|syslog:udp-rfc5424)
logger -t ctdbd "CTDB is being run with ${CTDB_LOGGING}. If nothing is logged then check your syslogd configuration"
;;
syslog|syslog:*) : ;;
file:*)
logger -t ctdbd "CTDB is being run without syslog enabled. Logs will be in ${CTDB_LOGGING#file:}"
;;
*)
logger -t ctdbd "CTDB is being run without syslog enabled. Logs will be in log.ctdb"
esac
eval "$ctdbd" "$ctdb_options" || return 1
# Wait until ctdbd has started and is ready to respond to clients.
_pid=""
_timeout="${CTDB_STARTUP_TIMEOUT:-10}"
_count=0
while [ "$_count" -lt "$_timeout" ] ; do
if $CTDB runstate first_recovery startup running >/dev/null 2>&1 ; then
return 0
fi
_count=$((_count + 1))
sleep 1
done
echo "Timed out waiting for initialisation - check logs - killing CTDB"
kill_ctdbd "$_pid"
drop_all_public_ips >/dev/null 2>&1
return 1
}
stop()
{
if ! _session=$(ctdbd_is_running) ; then
echo "CTDB is not running"
return 0
fi
$CTDB shutdown
# Wait for remaining CTDB processes to exit...
_timeout=${CTDB_SHUTDOWN_TIMEOUT:-30}
_count=0
_terminated=false
while [ "$_count" -lt "$_timeout" ] ; do
if ! pkill -0 -s "$_session" 2>/dev/null ; then
_terminated=true
break
fi
_count=$((_count + 1))
sleep 1
done
if ! $_terminated ; then
echo "Timed out waiting for CTDB to shutdown. Killing CTDB processes."
kill_ctdbd "$_session"
drop_all_public_ips >/dev/null 2>&1
sleep 1
if pkill -0 -s "$_session" ; then
# If SIGKILL didn't work then things are bad...
echo "Failed to kill all CTDB processes. Giving up."
return 1
fi
fi
dbdir_tmpfs_stop
return 0
}
############################################################
# Allow notifications for start/stop.
if [ -x "$CTDB_BASE/rc.ctdb" ] ; then
"$CTDB_BASE/rc.ctdb" "$action"
fi
case "$action" in
start) start ;;
stop) stop ;;
*)
echo "usage: $0 {start|stop}"
exit 1
esac