2007-04-11 18:54:22 +10:00
/*
standalone ctdb daemon
Copyright ( C ) Andrew Tridgell 2006
2007-05-31 13:50:53 +10:00
This program is free software ; you can redistribute it and / or modify
it under the terms of the GNU General Public License as published by
2007-07-10 15:29:31 +10:00
the Free Software Foundation ; either version 3 of the License , or
2007-05-31 13:50:53 +10:00
( at your option ) any later version .
This program is distributed in the hope that it will be useful ,
2007-04-11 18:54:22 +10:00
but WITHOUT ANY WARRANTY ; without even the implied warranty of
2007-05-31 13:50:53 +10:00
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
GNU General Public License for more details .
You should have received a copy of the GNU General Public License
2007-07-10 15:29:31 +10:00
along with this program ; if not , see < http : //www.gnu.org/licenses/>.
2007-04-11 18:54:22 +10:00
*/
2015-10-26 16:50:46 +11:00
# include "replace.h"
2007-04-11 18:54:22 +10:00
# include "system/filesys.h"
2008-01-17 11:33:23 +11:00
# include "system/time.h"
2007-04-11 22:19:46 +10:00
# include "system/wait.h"
2007-10-16 11:29:33 +10:00
# include "system/network.h"
2015-10-26 16:50:46 +11:00
# include <popt.h>
# include <talloc.h>
/* Allow use of deprecated function tevent_loop_allow_nesting() */
# define TEVENT_DEPRECATED
# include <tevent.h>
# include "lib/util/debug.h"
# include "lib/util/samba_util.h"
# include "ctdb_private.h"
2015-03-17 14:30:18 +11:00
# include "common/reqid.h"
2015-10-23 14:11:53 +11:00
# include "common/system.h"
2015-10-23 14:17:34 +11:00
# include "common/common.h"
2015-11-11 15:41:10 +11:00
# include "common/logging.h"
2007-04-11 13:17:36 +02:00
2007-05-29 12:49:25 +10:00
static struct {
2016-11-18 14:52:38 +11:00
const char * socket ;
const char * debuglevel ;
2007-06-02 10:03:28 +10:00
const char * nlist ;
const char * transport ;
const char * myaddress ;
2007-05-29 12:49:25 +10:00
const char * public_address_list ;
2007-08-15 14:44:03 +10:00
const char * event_script_dir ;
2009-03-31 14:23:31 +11:00
const char * notification_script ;
2014-08-11 17:07:41 +10:00
const char * logging ;
2016-05-17 18:28:56 +10:00
const char * recovery_lock ;
2007-06-02 10:03:28 +10:00
const char * db_dir ;
2007-09-21 12:24:02 +10:00
const char * db_dir_persistent ;
2009-11-23 14:38:03 +01:00
const char * db_dir_state ;
2007-09-10 14:26:35 +10:00
const char * public_interface ;
2009-12-16 20:59:15 +10:30
int valgrinding ;
2011-01-24 11:42:50 +11:00
int nosetsched ;
2008-02-22 09:42:52 +11:00
int start_as_disabled ;
2009-07-09 11:57:20 +10:00
int start_as_stopped ;
2008-05-06 10:41:22 +10:00
int no_lmaster ;
int no_recmaster ;
2008-10-17 07:56:12 +11:00
int script_log_level ;
2008-11-24 19:06:02 +11:00
int no_publicipcheck ;
2009-12-07 13:28:11 +01:00
int max_persistent_check_errors ;
2016-11-18 14:52:38 +11:00
int torture ;
2007-05-29 12:49:25 +10:00
} options = {
2017-08-11 15:18:13 +10:00
. socket = CTDB_SOCKET ,
2016-11-30 16:46:19 +11:00
. debuglevel = " NOTICE " ,
2013-10-21 19:33:10 +11:00
. nlist = NULL ,
2013-10-21 19:52:01 +11:00
. public_address_list = NULL ,
2007-06-02 10:03:28 +10:00
. transport = " tcp " ,
2013-10-15 14:10:58 +11:00
. event_script_dir = NULL ,
2014-08-11 17:07:41 +10:00
. logging = " file: " LOGDIR " /log.ctdb " ,
2013-10-03 15:47:30 +10:00
. db_dir = CTDB_VARDIR ,
. db_dir_persistent = CTDB_VARDIR " /persistent " ,
. db_dir_state = CTDB_VARDIR " /state " ,
2008-10-17 07:56:12 +11:00
. script_log_level = DEBUG_ERR ,
2007-05-29 12:49:25 +10:00
} ;
2008-10-17 07:56:12 +11:00
int script_log_level ;
2010-06-22 22:52:34 +09:30
bool fast_start ;
2007-04-11 18:54:22 +10:00
2007-06-07 22:06:19 +10:00
/*
called by the transport layer when a packet comes in
*/
static void ctdb_recv_pkt ( struct ctdb_context * ctdb , uint8_t * data , uint32_t length )
{
struct ctdb_req_header * hdr = ( struct ctdb_req_header * ) data ;
2010-09-29 10:38:41 +10:00
CTDB_INCREMENT_STAT ( ctdb , node_packets_recv ) ;
2007-06-07 22:06:19 +10:00
/* up the counter for this source node, so we know its alive */
2007-09-04 10:09:58 +10:00
if ( ctdb_validate_pnn ( ctdb , hdr - > srcnode ) ) {
2007-06-07 22:06:19 +10:00
/* as a special case, redirected calls don't increment the rx_cnt */
if ( hdr - > operation ! = CTDB_REQ_CALL | |
2015-10-29 16:26:29 +11:00
( ( struct ctdb_req_call_old * ) hdr ) - > hopcount = = 0 ) {
2007-06-07 22:06:19 +10:00
ctdb - > nodes [ hdr - > srcnode ] - > rx_cnt + + ;
}
}
ctdb_input_pkt ( ctdb , hdr ) ;
}
static const struct ctdb_upcalls ctdb_upcalls = {
. recv_pkt = ctdb_recv_pkt ,
. node_dead = ctdb_node_dead ,
. node_connected = ctdb_node_connected
} ;
2007-05-29 15:26:38 +10:00
2007-04-11 18:54:22 +10:00
/*
main program
*/
int main ( int argc , const char * argv [ ] )
{
struct ctdb_context * ctdb ;
2007-05-15 09:44:33 +10:00
int interactive = 0 ;
2007-04-11 18:54:22 +10:00
struct poptOption popt_options [ ] = {
POPT_AUTOHELP
2016-11-18 14:52:38 +11:00
{ " socket " , 0 , POPT_ARG_STRING , & options . socket , 0 , " local socket name " , " filename " } ,
{ " debug " , ' d ' , POPT_ARG_STRING , & options . debuglevel , 0 , " debug level " , NULL } ,
2007-05-15 09:44:33 +10:00
{ " interactive " , ' i ' , POPT_ARG_NONE , & interactive , 0 , " don't fork " , NULL } ,
2007-05-29 12:49:25 +10:00
{ " public-addresses " , 0 , POPT_ARG_STRING , & options . public_address_list , 0 , " public address list file " , " filename " } ,
2007-09-10 14:26:35 +10:00
{ " public-interface " , 0 , POPT_ARG_STRING , & options . public_interface , 0 , " public interface " , " interface " } ,
2007-08-15 14:44:03 +10:00
{ " event-script-dir " , 0 , POPT_ARG_STRING , & options . event_script_dir , 0 , " event script directory " , " dirname " } ,
2014-08-11 17:07:41 +10:00
{ " logging " , 0 , POPT_ARG_STRING , & options . logging , 0 , " logging method to be used " , NULL } ,
2007-06-02 10:03:28 +10:00
{ " nlist " , 0 , POPT_ARG_STRING , & options . nlist , 0 , " node list file " , " filename " } ,
2009-03-31 14:23:31 +11:00
{ " notification-script " , 0 , POPT_ARG_STRING , & options . notification_script , 0 , " notification script " , " filename " } ,
2007-06-02 10:03:28 +10:00
{ " listen " , 0 , POPT_ARG_STRING , & options . myaddress , 0 , " address to listen on " , " address " } ,
{ " transport " , 0 , POPT_ARG_STRING , & options . transport , 0 , " protocol transport " , NULL } ,
{ " dbdir " , 0 , POPT_ARG_STRING , & options . db_dir , 0 , " directory for the tdb files " , NULL } ,
2007-09-21 12:24:02 +10:00
{ " dbdir-persistent " , 0 , POPT_ARG_STRING , & options . db_dir_persistent , 0 , " directory for persistent tdb files " , NULL } ,
2009-11-23 14:38:03 +01:00
{ " dbdir-state " , 0 , POPT_ARG_STRING , & options . db_dir_state , 0 , " directory for internal state tdb files " , NULL } ,
2016-05-17 18:28:56 +10:00
{ " reclock " , 0 , POPT_ARG_STRING , & options . recovery_lock , 0 , " recovery lock " , " lock " } ,
2013-04-15 13:32:57 +10:00
{ " pidfile " , 0 , POPT_ARG_STRING , & ctdbd_pidfile , 0 , " location of PID file " , " filename " } ,
2011-01-10 13:35:39 +11:00
{ " valgrinding " , 0 , POPT_ARG_NONE , & options . valgrinding , 0 , " disable setscheduler SCHED_FIFO call, use mmap for tdbs " , NULL } ,
2011-01-24 11:42:50 +11:00
{ " nosetsched " , 0 , POPT_ARG_NONE , & options . nosetsched , 0 , " disable setscheduler SCHED_FIFO call, use mmap for tdbs " , NULL } ,
2008-02-22 09:42:52 +11:00
{ " start-as-disabled " , 0 , POPT_ARG_NONE , & options . start_as_disabled , 0 , " Node starts in disabled state " , NULL } ,
2009-07-09 11:57:20 +10:00
{ " start-as-stopped " , 0 , POPT_ARG_NONE , & options . start_as_stopped , 0 , " Node starts in stopped state " , NULL } ,
2008-05-06 10:41:22 +10:00
{ " no-lmaster " , 0 , POPT_ARG_NONE , & options . no_lmaster , 0 , " disable lmaster role on this node " , NULL } ,
{ " no-recmaster " , 0 , POPT_ARG_NONE , & options . no_recmaster , 0 , " disable recmaster role on this node " , NULL } ,
2013-10-21 19:42:32 +11:00
{ " script-log-level " , 0 , POPT_ARG_INT , & options . script_log_level , 0 , " log level of event script output " , NULL } ,
2010-01-05 11:04:24 +01:00
{ " nopublicipcheck " , 0 , POPT_ARG_NONE , & options . no_publicipcheck , 0 , " don't check we have/don't have the correct public ip addresses " , NULL } ,
2009-12-07 13:28:11 +01:00
{ " max-persistent-check-errors " , 0 , POPT_ARG_INT ,
& options . max_persistent_check_errors , 0 ,
" max allowed persistent check errors (default 0) " , NULL } ,
2010-06-22 22:52:34 +09:30
{ " sloppy-start " , 0 , POPT_ARG_NONE , & fast_start , 0 , " Do not perform full recovery on start " , NULL } ,
2016-11-18 14:52:38 +11:00
{ " torture " , 0 , POPT_ARG_NONE , & options . torture , 0 , " enable nastiness in library " , NULL } ,
2007-04-11 18:54:22 +10:00
POPT_TABLEEND
} ;
2007-05-29 12:49:25 +10:00
int opt , ret ;
2007-04-11 18:54:22 +10:00
const char * * extra_argv ;
poptContext pc ;
2015-10-26 16:50:09 +11:00
struct tevent_context * ev ;
2007-04-11 18:54:22 +10:00
pc = poptGetContext ( argv [ 0 ] , argc , argv , popt_options , POPT_CONTEXT_KEEP_FIRST ) ;
while ( ( opt = poptGetNextOpt ( pc ) ) ! = - 1 ) {
switch ( opt ) {
default :
fprintf ( stderr , " Invalid option %s: %s \n " ,
poptBadOption ( pc , 0 ) , poptStrerror ( opt ) ) ;
exit ( 1 ) ;
}
}
2016-11-28 09:51:48 +11:00
/* If there are extra arguments then exit with usage message */
2007-04-11 18:54:22 +10:00
extra_argv = poptGetArgs ( pc ) ;
if ( extra_argv ) {
extra_argv + + ;
2016-11-28 09:51:48 +11:00
if ( extra_argv [ 0 ] ) {
poptPrintHelp ( pc , stdout , 0 ) ;
exit ( 1 ) ;
}
2007-04-11 18:54:22 +10:00
}
2008-01-16 09:44:48 +11:00
talloc_enable_null_tracking ( ) ;
2014-08-15 15:55:20 +10:00
fault_setup ( ) ;
2007-04-11 13:17:36 +02:00
2015-10-26 16:50:09 +11:00
ev = tevent_context_init ( NULL ) ;
2016-07-27 11:45:49 +10:00
if ( ev = = NULL ) {
2016-11-30 17:04:54 +11:00
fprintf ( stderr , " tevent_context_init() failed \n " ) ;
2016-07-27 11:45:49 +10:00
exit ( 1 ) ;
}
2010-08-18 10:11:59 +10:00
tevent_loop_allow_nesting ( ev ) ;
2007-04-11 18:54:22 +10:00
2016-11-18 14:52:38 +11:00
ctdb = ctdb_init ( ev ) ;
if ( ctdb = = NULL ) {
fprintf ( stderr , " Failed to init ctdb \n " ) ;
exit ( 1 ) ;
}
if ( options . torture = = 1 ) {
ctdb_set_flags ( ctdb , CTDB_FLAG_TORTURE ) ;
}
2016-11-29 17:52:00 +11:00
/* Log to stderr when running as interactive */
if ( interactive ) {
options . logging = " file: " ;
}
2016-11-30 16:46:19 +11:00
/* Initialize logging and set the debug level */
if ( ! ctdb_logging_init ( ctdb , options . logging , options . debuglevel ) ) {
exit ( 1 ) ;
2016-11-18 14:52:38 +11:00
}
2016-11-30 16:46:19 +11:00
setenv ( " CTDB_LOGGING " , options . logging , 1 ) ;
setenv ( " CTDB_DEBUGLEVEL " , debug_level_to_string ( DEBUGLEVEL ) , 1 ) ;
2016-11-18 14:52:38 +11:00
setenv ( " CTDB_SOCKET " , options . socket , 1 ) ;
ret = ctdb_set_socketname ( ctdb , options . socket ) ;
if ( ret = = - 1 ) {
2016-11-30 17:04:54 +11:00
DEBUG ( DEBUG_ERR , ( " ctdb_set_socketname() failed \n " ) ) ;
2016-11-18 14:52:38 +11:00
exit ( 1 ) ;
}
2007-04-11 18:54:22 +10:00
2008-02-22 09:42:52 +11:00
ctdb - > start_as_disabled = options . start_as_disabled ;
2009-07-09 11:57:20 +10:00
ctdb - > start_as_stopped = options . start_as_stopped ;
2008-02-22 09:42:52 +11:00
2008-10-17 07:56:12 +11:00
script_log_level = options . script_log_level ;
2011-08-04 13:44:25 +10:00
DEBUG ( DEBUG_NOTICE , ( " CTDB starting on node \n " ) ) ;
2010-09-22 10:59:01 +10:00
2008-01-17 11:33:23 +11:00
gettimeofday ( & ctdb - > ctdbd_start_time , NULL ) ;
2008-07-02 13:55:59 +10:00
gettimeofday ( & ctdb - > last_recovery_started , NULL ) ;
gettimeofday ( & ctdb - > last_recovery_finished , NULL ) ;
2007-06-07 22:06:19 +10:00
ctdb - > recovery_mode = CTDB_RECOVERY_NORMAL ;
ctdb - > recovery_master = ( uint32_t ) - 1 ;
ctdb - > upcalls = & ctdb_upcalls ;
2016-05-17 18:24:53 +10:00
2016-05-17 18:28:56 +10:00
if ( options . recovery_lock = = NULL ) {
DEBUG ( DEBUG_WARNING , ( " Recovery lock not set \n " ) ) ;
2016-05-17 18:24:53 +10:00
}
2016-05-17 18:28:56 +10:00
ctdb - > recovery_lock = options . recovery_lock ;
2007-06-07 22:06:19 +10:00
2016-04-05 17:11:17 +10:00
TALLOC_FREE ( ctdb - > idr ) ;
2015-03-17 14:30:18 +11:00
ret = reqid_init ( ctdb , 0 , & ctdb - > idr ) ; ;
if ( ret ! = 0 ) {
2016-11-30 17:04:54 +11:00
DEBUG ( DEBUG_ERR , ( " reqid_init failed (%s) \n " , strerror ( ret ) ) ) ;
2015-03-17 14:30:18 +11:00
exit ( 1 ) ;
}
2007-06-07 22:06:19 +10:00
ctdb_tunables_set_defaults ( ctdb ) ;
2007-06-02 10:03:28 +10:00
ret = ctdb_set_transport ( ctdb , options . transport ) ;
if ( ret = = - 1 ) {
2016-11-30 17:04:54 +11:00
DEBUG ( DEBUG_ERR , ( " ctdb_set_transport failed - %s \n " ,
ctdb_errstr ( ctdb ) ) ) ;
2007-06-02 10:03:28 +10:00
exit ( 1 ) ;
}
/* tell ctdb what address to listen on */
if ( options . myaddress ) {
ret = ctdb_set_address ( ctdb , options . myaddress ) ;
if ( ret = = - 1 ) {
2016-11-30 17:04:54 +11:00
DEBUG ( DEBUG_ERR , ( " ctdb_set_address failed - %s \n " ,
ctdb_errstr ( ctdb ) ) ) ;
2007-06-02 10:03:28 +10:00
exit ( 1 ) ;
}
}
2008-05-06 10:02:27 +10:00
/* set ctdbd capabilities */
2015-09-17 16:13:55 +10:00
ctdb - > capabilities = CTDB_CAP_DEFAULT ;
2015-10-08 20:25:20 +11:00
if ( options . no_lmaster ! = 0 ) {
ctdb - > capabilities & = ~ CTDB_CAP_LMASTER ;
2008-05-06 10:41:22 +10:00
}
2015-10-08 20:25:20 +11:00
if ( options . no_recmaster ! = 0 ) {
ctdb - > capabilities & = ~ CTDB_CAP_RECMASTER ;
2008-05-06 10:41:22 +10:00
}
2008-05-06 10:02:27 +10:00
2012-12-04 14:28:06 +11:00
/* Initialise this node's PNN to the unknown value. This will
* be set to the correct value by either ctdb_add_node ( ) as
* part of loading the nodes file or by
* ctdb_tcp_listen_automatic ( ) when the transport is
* initialised . At some point we should de - optimise this and
* pull it out into ctdb_start_daemon ( ) so it is done clearly
* and only in one place .
*/
ctdb - > pnn = - 1 ;
2013-10-21 19:33:10 +11:00
/* Default value for CTDB_BASE - don't override */
2014-06-23 18:03:17 +10:00
setenv ( " CTDB_BASE " , CTDB_ETCDIR , 0 ) ;
2013-10-21 19:33:10 +11:00
2007-06-02 10:03:28 +10:00
/* tell ctdb what nodes are available */
2013-10-21 19:33:10 +11:00
if ( options . nlist ! = NULL ) {
ctdb - > nodes_file = options . nlist ;
} else {
ctdb - > nodes_file =
talloc_asprintf ( ctdb , " %s/nodes " , getenv ( " CTDB_BASE " ) ) ;
if ( ctdb - > nodes_file = = NULL ) {
2016-11-30 17:04:54 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Out of memory \n " ) ) ;
2013-10-21 19:33:10 +11:00
exit ( 1 ) ;
}
}
2008-02-19 14:44:48 +11:00
ctdb_load_nodes_file ( ctdb ) ;
2007-06-02 10:03:28 +10:00
2013-10-21 19:36:36 +11:00
ctdb - > db_directory = options . db_dir ;
2014-06-06 15:24:20 +10:00
mkdir_p_or_die ( ctdb - > db_directory , 0700 ) ;
2013-10-21 19:36:36 +11:00
2013-10-21 19:36:36 +11:00
ctdb - > db_directory_persistent = options . db_dir_persistent ;
2014-06-06 15:24:20 +10:00
mkdir_p_or_die ( ctdb - > db_directory_persistent , 0700 ) ;
2013-10-21 19:36:36 +11:00
2013-10-21 19:36:36 +11:00
ctdb - > db_directory_state = options . db_dir_state ;
2014-06-06 15:24:20 +10:00
mkdir_p_or_die ( ctdb - > db_directory_state , 0700 ) ;
2007-06-02 10:03:28 +10:00
2007-09-10 14:26:35 +10:00
if ( options . public_interface ) {
ctdb - > default_public_interface = talloc_strdup ( ctdb , options . public_interface ) ;
CTDB_NO_MEMORY ( ctdb , ctdb - > default_public_interface ) ;
}
2013-10-15 14:10:58 +11:00
if ( options . event_script_dir ! = NULL ) {
ctdb - > event_script_dir = options . event_script_dir ;
} else {
ctdb - > event_script_dir = talloc_asprintf ( ctdb , " %s/events.d " ,
getenv ( " CTDB_BASE " ) ) ;
if ( ctdb - > event_script_dir = = NULL ) {
2016-11-30 17:04:54 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Out of memory \n " ) ) ;
2013-10-15 14:10:58 +11:00
exit ( 1 ) ;
}
2007-08-15 14:44:03 +10:00
}
2009-03-31 14:23:31 +11:00
if ( options . notification_script ! = NULL ) {
ret = ctdb_set_notification_script ( ctdb , options . notification_script ) ;
if ( ret = = - 1 ) {
2016-11-30 17:04:54 +11:00
DEBUG ( DEBUG_ERR , ( " Unable to setup notification script \n " ) ) ;
2009-03-31 14:23:31 +11:00
exit ( 1 ) ;
}
}
2016-06-17 18:09:37 +10:00
ctdb - > valgrinding = ( options . valgrinding = = 1 ) ;
2016-06-20 10:42:43 +02:00
ctdb - > do_setsched = ( options . nosetsched ! = 1 ) ;
if ( ctdb - > valgrinding ) {
2016-06-17 18:10:16 +10:00
ctdb - > do_setsched = false ;
2011-01-24 11:42:50 +11:00
}
2007-07-13 08:47:02 +10:00
2013-10-21 19:52:01 +11:00
ctdb - > public_addresses_file = options . public_address_list ;
2016-06-17 18:09:37 +10:00
ctdb - > do_checkpublicip = ( options . no_publicipcheck = = 0 ) ;
2012-03-22 15:27:25 +11:00
2009-12-07 13:28:11 +01:00
if ( options . max_persistent_check_errors < 0 ) {
ctdb - > max_persistent_check_errors = 0xFFFFFFFFFFFFFFFFLL ;
} else {
ctdb - > max_persistent_check_errors = ( uint64_t ) options . max_persistent_check_errors ;
}
2007-04-29 16:19:40 +02:00
/* start the protocol running (as a child) */
2014-08-08 20:57:05 +10:00
return ctdb_start_daemon ( ctdb , interactive ? false : true ) ;
2007-04-11 18:54:22 +10:00
}