2007-04-11 12:54:22 +04:00
/*
standalone ctdb daemon
Copyright ( C ) Andrew Tridgell 2006
2007-05-31 07:50:53 +04:00
This program is free software ; you can redistribute it and / or modify
it under the terms of the GNU General Public License as published by
2007-07-10 09:29:31 +04:00
the Free Software Foundation ; either version 3 of the License , or
2007-05-31 07:50:53 +04:00
( at your option ) any later version .
This program is distributed in the hope that it will be useful ,
2007-04-11 12:54:22 +04:00
but WITHOUT ANY WARRANTY ; without even the implied warranty of
2007-05-31 07:50:53 +04:00
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
GNU General Public License for more details .
You should have received a copy of the GNU General Public License
2007-07-10 09:29:31 +04:00
along with this program ; if not , see < http : //www.gnu.org/licenses/>.
2007-04-11 12:54:22 +04:00
*/
# include "includes.h"
# include "system/filesys.h"
# include "popt.h"
2008-01-17 03:33:23 +03:00
# include "system/time.h"
2007-04-11 16:19:46 +04:00
# include "system/wait.h"
2007-10-16 05:29:33 +04:00
# include "system/network.h"
2007-04-17 16:16:50 +04:00
# include "cmdline.h"
2007-04-30 00:42:23 +04:00
# include "../include/ctdb_private.h"
2007-04-11 15:17:36 +04:00
2007-05-29 06:49:25 +04:00
static struct {
2007-06-02 04:03:28 +04:00
const char * nlist ;
const char * transport ;
const char * myaddress ;
2007-05-29 06:49:25 +04:00
const char * public_address_list ;
2007-08-15 08:44:03 +04:00
const char * event_script_dir ;
2009-03-31 07:23:31 +04:00
const char * notification_script ;
2012-05-17 04:17:51 +04:00
const char * debug_hung_script ;
2007-05-29 09:26:38 +04:00
const char * logfile ;
2007-06-02 04:03:28 +04:00
const char * recovery_lock_file ;
const char * db_dir ;
2007-09-21 06:24:02 +04:00
const char * db_dir_persistent ;
2009-11-23 16:38:03 +03:00
const char * db_dir_state ;
2007-09-10 08:26:35 +04:00
const char * public_interface ;
2007-10-10 03:42:32 +04:00
const char * single_public_ip ;
2009-12-16 13:29:15 +03:00
int valgrinding ;
2011-01-24 03:42:50 +03:00
int nosetsched ;
2008-01-16 14:03:01 +03:00
int use_syslog ;
2008-02-22 01:42:52 +03:00
int start_as_disabled ;
2009-07-09 05:57:20 +04:00
int start_as_stopped ;
2008-05-06 04:41:22 +04:00
int no_lmaster ;
int no_recmaster ;
2008-07-10 04:37:22 +04:00
int lvs ;
2008-10-17 00:56:12 +04:00
int script_log_level ;
2008-11-24 11:06:02 +03:00
int no_publicipcheck ;
2009-12-07 15:28:11 +03:00
int max_persistent_check_errors ;
2007-05-29 06:49:25 +04:00
} options = {
2007-06-02 04:03:28 +04:00
. nlist = ETCDIR " /ctdb/nodes " ,
. transport = " tcp " ,
2007-08-15 08:44:03 +04:00
. event_script_dir = ETCDIR " /ctdb/events.d " ,
2009-02-04 02:15:57 +03:00
. logfile = LOGDIR " /log.ctdb " ,
2007-06-02 04:03:28 +04:00
. db_dir = VARDIR " /ctdb " ,
2007-09-21 06:24:02 +04:00
. db_dir_persistent = VARDIR " /ctdb/persistent " ,
2009-11-23 16:38:03 +03:00
. db_dir_state = VARDIR " /ctdb/state " ,
2008-10-17 00:56:12 +04:00
. script_log_level = DEBUG_ERR ,
2012-05-17 04:17:51 +04:00
. debug_hung_script = " /etc/ctdb/debug-hung-script.sh " ,
2007-05-29 06:49:25 +04:00
} ;
2008-10-17 00:56:12 +04:00
int script_log_level ;
2010-06-22 17:22:34 +04:00
bool fast_start ;
2007-04-11 12:54:22 +04:00
2007-06-07 16:06:19 +04:00
/*
called by the transport layer when a packet comes in
*/
static void ctdb_recv_pkt ( struct ctdb_context * ctdb , uint8_t * data , uint32_t length )
{
struct ctdb_req_header * hdr = ( struct ctdb_req_header * ) data ;
2010-09-29 04:38:41 +04:00
CTDB_INCREMENT_STAT ( ctdb , node_packets_recv ) ;
2007-06-07 16:06:19 +04:00
/* up the counter for this source node, so we know its alive */
2007-09-04 04:09:58 +04:00
if ( ctdb_validate_pnn ( ctdb , hdr - > srcnode ) ) {
2007-06-07 16:06:19 +04:00
/* as a special case, redirected calls don't increment the rx_cnt */
if ( hdr - > operation ! = CTDB_REQ_CALL | |
( ( struct ctdb_req_call * ) hdr ) - > hopcount = = 0 ) {
ctdb - > nodes [ hdr - > srcnode ] - > rx_cnt + + ;
}
}
ctdb_input_pkt ( ctdb , hdr ) ;
}
2008-02-19 06:44:48 +03:00
void ctdb_load_nodes_file ( struct ctdb_context * ctdb )
{
int ret ;
2007-06-07 16:06:19 +04:00
2008-02-19 06:44:48 +03:00
ret = ctdb_set_nlist ( ctdb , options . nlist ) ;
if ( ret = = - 1 ) {
DEBUG ( DEBUG_ALERT , ( " ctdb_set_nlist failed - %s \n " , ctdb_errstr ( ctdb ) ) ) ;
exit ( 1 ) ;
}
}
2007-06-07 16:06:19 +04:00
static const struct ctdb_upcalls ctdb_upcalls = {
. recv_pkt = ctdb_recv_pkt ,
. node_dead = ctdb_node_dead ,
. node_connected = ctdb_node_connected
} ;
2007-05-29 09:26:38 +04:00
2007-04-11 12:54:22 +04:00
/*
main program
*/
int main ( int argc , const char * argv [ ] )
{
struct ctdb_context * ctdb ;
2007-05-15 03:44:33 +04:00
int interactive = 0 ;
2007-04-11 12:54:22 +04:00
struct poptOption popt_options [ ] = {
POPT_AUTOHELP
2007-04-17 16:13:06 +04:00
POPT_CTDB_CMDLINE
2007-05-15 03:44:33 +04:00
{ " interactive " , ' i ' , POPT_ARG_NONE , & interactive , 0 , " don't fork " , NULL } ,
2007-05-29 06:49:25 +04:00
{ " public-addresses " , 0 , POPT_ARG_STRING , & options . public_address_list , 0 , " public address list file " , " filename " } ,
2007-09-10 08:26:35 +04:00
{ " public-interface " , 0 , POPT_ARG_STRING , & options . public_interface , 0 , " public interface " , " interface " } ,
2007-10-10 03:42:32 +04:00
{ " single-public-ip " , 0 , POPT_ARG_STRING , & options . single_public_ip , 0 , " single public ip " , " ip-address " } ,
2007-08-15 08:44:03 +04:00
{ " event-script-dir " , 0 , POPT_ARG_STRING , & options . event_script_dir , 0 , " event script directory " , " dirname " } ,
2007-05-29 09:26:38 +04:00
{ " logfile " , 0 , POPT_ARG_STRING , & options . logfile , 0 , " log file location " , " filename " } ,
2007-06-02 04:03:28 +04:00
{ " nlist " , 0 , POPT_ARG_STRING , & options . nlist , 0 , " node list file " , " filename " } ,
2009-03-31 07:23:31 +04:00
{ " notification-script " , 0 , POPT_ARG_STRING , & options . notification_script , 0 , " notification script " , " filename " } ,
2012-05-17 04:17:51 +04:00
{ " debug-hung-script " , 0 , POPT_ARG_STRING , & options . debug_hung_script , 0 , " debug script for hung eventscripts " , " filename " } ,
2007-06-02 04:03:28 +04:00
{ " listen " , 0 , POPT_ARG_STRING , & options . myaddress , 0 , " address to listen on " , " address " } ,
{ " transport " , 0 , POPT_ARG_STRING , & options . transport , 0 , " protocol transport " , NULL } ,
{ " dbdir " , 0 , POPT_ARG_STRING , & options . db_dir , 0 , " directory for the tdb files " , NULL } ,
2007-09-21 06:24:02 +04:00
{ " dbdir-persistent " , 0 , POPT_ARG_STRING , & options . db_dir_persistent , 0 , " directory for persistent tdb files " , NULL } ,
2009-11-23 16:38:03 +03:00
{ " dbdir-state " , 0 , POPT_ARG_STRING , & options . db_dir_state , 0 , " directory for internal state tdb files " , NULL } ,
2007-06-02 05:36:42 +04:00
{ " reclock " , 0 , POPT_ARG_STRING , & options . recovery_lock_file , 0 , " location of recovery lock file " , " filename " } ,
2011-01-10 05:35:39 +03:00
{ " valgrinding " , 0 , POPT_ARG_NONE , & options . valgrinding , 0 , " disable setscheduler SCHED_FIFO call, use mmap for tdbs " , NULL } ,
2011-01-24 03:42:50 +03:00
{ " nosetsched " , 0 , POPT_ARG_NONE , & options . nosetsched , 0 , " disable setscheduler SCHED_FIFO call, use mmap for tdbs " , NULL } ,
2008-01-16 14:03:01 +03:00
{ " syslog " , 0 , POPT_ARG_NONE , & options . use_syslog , 0 , " log messages to syslog " , NULL } ,
2008-02-22 01:42:52 +03:00
{ " start-as-disabled " , 0 , POPT_ARG_NONE , & options . start_as_disabled , 0 , " Node starts in disabled state " , NULL } ,
2009-07-09 05:57:20 +04:00
{ " start-as-stopped " , 0 , POPT_ARG_NONE , & options . start_as_stopped , 0 , " Node starts in stopped state " , NULL } ,
2008-05-06 04:41:22 +04:00
{ " no-lmaster " , 0 , POPT_ARG_NONE , & options . no_lmaster , 0 , " disable lmaster role on this node " , NULL } ,
{ " no-recmaster " , 0 , POPT_ARG_NONE , & options . no_recmaster , 0 , " disable recmaster role on this node " , NULL } ,
2008-07-10 04:37:22 +04:00
{ " lvs " , 0 , POPT_ARG_NONE , & options . lvs , 0 , " lvs is enabled on this node " , NULL } ,
2008-10-17 00:56:12 +04:00
{ " script-log-level " , 0 , POPT_ARG_INT , & options . script_log_level , DEBUG_ERR , " log level of event script output " , NULL } ,
2010-01-05 13:04:24 +03:00
{ " nopublicipcheck " , 0 , POPT_ARG_NONE , & options . no_publicipcheck , 0 , " don't check we have/don't have the correct public ip addresses " , NULL } ,
2009-12-07 15:28:11 +03:00
{ " max-persistent-check-errors " , 0 , POPT_ARG_INT ,
& options . max_persistent_check_errors , 0 ,
" max allowed persistent check errors (default 0) " , NULL } ,
2010-01-15 07:38:56 +03:00
{ " log-ringbuf-size " , 0 , POPT_ARG_INT , & log_ringbuf_size , DEBUG_ERR , " Number of log messages we can store in the memory ringbuffer " , NULL } ,
2010-06-22 17:22:34 +04:00
{ " sloppy-start " , 0 , POPT_ARG_NONE , & fast_start , 0 , " Do not perform full recovery on start " , NULL } ,
2007-04-11 12:54:22 +04:00
POPT_TABLEEND
} ;
2007-05-29 06:49:25 +04:00
int opt , ret ;
2007-04-11 12:54:22 +04:00
const char * * extra_argv ;
int extra_argc = 0 ;
poptContext pc ;
struct event_context * ev ;
pc = poptGetContext ( argv [ 0 ] , argc , argv , popt_options , POPT_CONTEXT_KEEP_FIRST ) ;
while ( ( opt = poptGetNextOpt ( pc ) ) ! = - 1 ) {
switch ( opt ) {
default :
fprintf ( stderr , " Invalid option %s: %s \n " ,
poptBadOption ( pc , 0 ) , poptStrerror ( opt ) ) ;
exit ( 1 ) ;
}
}
/* setup the remaining options for the main program to use */
extra_argv = poptGetArgs ( pc ) ;
if ( extra_argv ) {
extra_argv + + ;
while ( extra_argv [ extra_argc ] ) extra_argc + + ;
}
2008-01-16 01:44:48 +03:00
talloc_enable_null_tracking ( ) ;
2008-01-10 01:43:14 +03:00
ctdb_block_signal ( SIGPIPE ) ;
2010-01-07 11:21:56 +03:00
fault_setup ( " ctdbd " ) ;
2007-04-11 15:17:36 +04:00
2007-04-11 12:54:22 +04:00
ev = event_context_init ( NULL ) ;
2010-08-18 04:11:59 +04:00
tevent_loop_allow_nesting ( ev ) ;
2007-04-11 12:54:22 +04:00
2007-04-17 16:13:06 +04:00
ctdb = ctdb_cmdline_init ( ev ) ;
2007-04-11 12:54:22 +04:00
2008-02-22 01:42:52 +03:00
ctdb - > start_as_disabled = options . start_as_disabled ;
2009-07-09 05:57:20 +04:00
ctdb - > start_as_stopped = options . start_as_stopped ;
2008-02-22 01:42:52 +03:00
2008-10-17 00:56:12 +04:00
script_log_level = options . script_log_level ;
2008-01-16 14:03:01 +03:00
ret = ctdb_set_logfile ( ctdb , options . logfile , options . use_syslog ) ;
2007-08-21 03:33:03 +04:00
if ( ret = = - 1 ) {
2008-01-16 14:03:01 +03:00
printf ( " ctdb_set_logfile to %s failed - %s \n " ,
options . use_syslog ? " syslog " : options . logfile , ctdb_errstr ( ctdb ) ) ;
2007-08-21 03:33:03 +04:00
exit ( 1 ) ;
}
2011-08-04 07:44:25 +04:00
DEBUG ( DEBUG_NOTICE , ( " CTDB starting on node \n " ) ) ;
2010-09-22 04:59:01 +04:00
2008-01-17 03:33:23 +03:00
gettimeofday ( & ctdb - > ctdbd_start_time , NULL ) ;
2008-07-02 07:55:59 +04:00
gettimeofday ( & ctdb - > last_recovery_started , NULL ) ;
gettimeofday ( & ctdb - > last_recovery_finished , NULL ) ;
2007-06-07 16:06:19 +04:00
ctdb - > recovery_mode = CTDB_RECOVERY_NORMAL ;
ctdb - > recovery_master = ( uint32_t ) - 1 ;
ctdb - > upcalls = & ctdb_upcalls ;
ctdb - > idr = idr_init ( ctdb ) ;
ctdb - > recovery_lock_fd = - 1 ;
ctdb_tunables_set_defaults ( ctdb ) ;
2007-06-02 05:36:42 +04:00
ret = ctdb_set_recovery_lock_file ( ctdb , options . recovery_lock_file ) ;
if ( ret = = - 1 ) {
2008-02-04 12:07:15 +03:00
DEBUG ( DEBUG_ALERT , ( " ctdb_set_recovery_lock_file failed - %s \n " , ctdb_errstr ( ctdb ) ) ) ;
2007-06-02 05:36:42 +04:00
exit ( 1 ) ;
}
2007-06-02 04:03:28 +04:00
ret = ctdb_set_transport ( ctdb , options . transport ) ;
if ( ret = = - 1 ) {
2008-02-04 12:07:15 +03:00
DEBUG ( DEBUG_ALERT , ( " ctdb_set_transport failed - %s \n " , ctdb_errstr ( ctdb ) ) ) ;
2007-06-02 04:03:28 +04:00
exit ( 1 ) ;
}
/* tell ctdb what address to listen on */
if ( options . myaddress ) {
ret = ctdb_set_address ( ctdb , options . myaddress ) ;
if ( ret = = - 1 ) {
2008-02-04 12:07:15 +03:00
DEBUG ( DEBUG_ALERT , ( " ctdb_set_address failed - %s \n " , ctdb_errstr ( ctdb ) ) ) ;
2007-06-02 04:03:28 +04:00
exit ( 1 ) ;
}
}
2008-05-06 04:02:27 +04:00
/* set ctdbd capabilities */
2008-05-06 04:41:22 +04:00
ctdb - > capabilities = 0 ;
if ( options . no_lmaster = = 0 ) {
ctdb - > capabilities | = CTDB_CAP_LMASTER ;
}
if ( options . no_recmaster = = 0 ) {
ctdb - > capabilities | = CTDB_CAP_RECMASTER ;
}
2008-07-10 04:37:22 +04:00
if ( options . lvs ! = 0 ) {
ctdb - > capabilities | = CTDB_CAP_LVS ;
}
2008-05-06 04:02:27 +04:00
2007-06-02 04:03:28 +04:00
/* tell ctdb what nodes are available */
2008-02-19 06:44:48 +03:00
ctdb_load_nodes_file ( ctdb ) ;
2007-06-02 04:03:28 +04:00
if ( options . db_dir ) {
ret = ctdb_set_tdb_dir ( ctdb , options . db_dir ) ;
if ( ret = = - 1 ) {
2008-02-04 12:07:15 +03:00
DEBUG ( DEBUG_ALERT , ( " ctdb_set_tdb_dir failed - %s \n " , ctdb_errstr ( ctdb ) ) ) ;
2007-06-02 04:03:28 +04:00
exit ( 1 ) ;
}
}
2007-09-21 06:24:02 +04:00
if ( options . db_dir_persistent ) {
ret = ctdb_set_tdb_dir_persistent ( ctdb , options . db_dir_persistent ) ;
if ( ret = = - 1 ) {
2008-02-04 12:07:15 +03:00
DEBUG ( DEBUG_ALERT , ( " ctdb_set_tdb_dir_persistent failed - %s \n " , ctdb_errstr ( ctdb ) ) ) ;
2007-09-21 06:24:02 +04:00
exit ( 1 ) ;
}
}
2009-11-23 16:38:03 +03:00
if ( options . db_dir_state ) {
ret = ctdb_set_tdb_dir_state ( ctdb , options . db_dir_state ) ;
if ( ret = = - 1 ) {
DEBUG ( DEBUG_ALERT , ( " ctdb_set_tdb_dir_state failed - %s \n " , ctdb_errstr ( ctdb ) ) ) ;
exit ( 1 ) ;
}
}
2007-06-02 04:03:28 +04:00
2007-09-10 08:26:35 +04:00
if ( options . public_interface ) {
ctdb - > default_public_interface = talloc_strdup ( ctdb , options . public_interface ) ;
CTDB_NO_MEMORY ( ctdb , ctdb - > default_public_interface ) ;
}
2007-10-10 03:42:32 +04:00
if ( options . single_public_ip ) {
if ( options . public_interface = = NULL ) {
2008-02-04 12:07:15 +03:00
DEBUG ( DEBUG_ALERT , ( " --single_public_ip used but --public_interface is not specified. You must specify the public interface when using single public ip. Exiting \n " ) ) ;
2007-10-10 03:42:32 +04:00
exit ( 10 ) ;
}
2009-12-14 21:33:35 +03:00
ret = ctdb_set_single_public_ip ( ctdb , options . public_interface ,
options . single_public_ip ) ;
if ( ret ! = 0 ) {
2008-02-04 12:07:15 +03:00
DEBUG ( DEBUG_ALERT , ( " Invalid --single-public-ip argument : %s . This is not a valid ip address. Exiting. \n " , options . single_public_ip ) ) ;
2007-10-10 03:42:32 +04:00
exit ( 10 ) ;
}
}
2007-08-15 08:44:03 +04:00
ret = ctdb_set_event_script_dir ( ctdb , options . event_script_dir ) ;
if ( ret = = - 1 ) {
2008-02-04 12:07:15 +03:00
DEBUG ( DEBUG_ALERT , ( " Unable to setup event script directory \n " ) ) ;
2007-08-15 08:44:03 +04:00
exit ( 1 ) ;
}
2009-03-31 07:23:31 +04:00
if ( options . notification_script ! = NULL ) {
ret = ctdb_set_notification_script ( ctdb , options . notification_script ) ;
if ( ret = = - 1 ) {
DEBUG ( DEBUG_ALERT , ( " Unable to setup notification script \n " ) ) ;
exit ( 1 ) ;
}
}
2012-05-17 04:17:51 +04:00
if ( options . debug_hung_script ! = NULL ) {
ret = ctdb_set_debug_hung_script ( ctdb , options . debug_hung_script ) ;
}
if ( ret = = - 1 ) {
DEBUG ( DEBUG_ALERT , ( " Unable to setup script to debug hung eventscripts \n " ) ) ;
exit ( 1 ) ;
}
2009-12-16 13:29:15 +03:00
ctdb - > valgrinding = options . valgrinding ;
2011-01-24 03:42:50 +03:00
if ( options . valgrinding | | options . nosetsched ) {
ctdb - > do_setsched = 0 ;
} else {
ctdb - > do_setsched = 1 ;
}
2007-07-13 02:47:02 +04:00
2012-03-22 08:27:25 +04:00
ctdb - > do_checkpublicip = ! options . no_publicipcheck ;
2009-12-07 15:28:11 +03:00
if ( options . max_persistent_check_errors < 0 ) {
ctdb - > max_persistent_check_errors = 0xFFFFFFFFFFFFFFFFLL ;
} else {
ctdb - > max_persistent_check_errors = ( uint64_t ) options . max_persistent_check_errors ;
}
2008-11-20 08:39:56 +03:00
if ( getenv ( " CTDB_BASE " ) = = NULL ) {
/* setup a environment variable for the event scripts to use
to find the installation directory */
setenv ( " CTDB_BASE " , ETCDIR " /ctdb " , 1 ) ;
}
2007-09-14 08:14:03 +04:00
2007-04-29 18:19:40 +04:00
/* start the protocol running (as a child) */
2012-05-17 10:08:37 +04:00
return ctdb_start_daemon ( ctdb , interactive ? false : true , options . use_syslog , options . public_address_list ) ;
2007-04-11 12:54:22 +04:00
}