2023-03-22 09:36:23 +01:00
/*
2007-04-10 06:03:39 +10:00
ctdb daemon code
Copyright ( C ) Andrew Tridgell 2006
2007-05-31 13:50:53 +10:00
This program is free software ; you can redistribute it and / or modify
it under the terms of the GNU General Public License as published by
2007-07-10 15:29:31 +10:00
the Free Software Foundation ; either version 3 of the License , or
2007-05-31 13:50:53 +10:00
( at your option ) any later version .
2023-03-22 09:36:23 +01:00
2007-05-31 13:50:53 +10:00
This program is distributed in the hope that it will be useful ,
2007-04-10 06:03:39 +10:00
but WITHOUT ANY WARRANTY ; without even the implied warranty of
2007-05-31 13:50:53 +10:00
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
GNU General Public License for more details .
2023-03-22 09:36:23 +01:00
2007-05-31 13:50:53 +10:00
You should have received a copy of the GNU General Public License
2007-07-10 15:29:31 +10:00
along with this program ; if not , see < http : //www.gnu.org/licenses/>.
2007-04-10 06:03:39 +10:00
*/
2015-10-26 16:50:46 +11:00
# include "replace.h"
2007-04-10 06:03:39 +10:00
# include "system/network.h"
# include "system/filesys.h"
2007-04-17 15:33:20 +10:00
# include "system/wait.h"
2015-10-26 16:50:46 +11:00
# include "system/time.h"
# include <talloc.h>
/* Allow use of deprecated function tevent_loop_allow_nesting() */
# define TEVENT_DEPRECATED
# include <tevent.h>
# include <tdb.h>
# include "lib/tdb_wrap/tdb_wrap.h"
# include "lib/util/dlinklist.h"
# include "lib/util/debug.h"
2017-08-15 12:51:59 +10:00
# include "lib/util/time.h"
2016-05-27 13:50:06 +10:00
# include "lib/util/blocking.h"
2017-08-15 12:53:02 +10:00
# include "lib/util/become_daemon.h"
2015-10-26 16:50:46 +11:00
2019-03-15 12:14:27 +11:00
# include "version.h"
2015-10-26 16:50:46 +11:00
# include "ctdb_private.h"
# include "ctdb_client.h"
# include "common/rb_tree.h"
2015-03-17 14:30:18 +11:00
# include "common/reqid.h"
2015-10-23 14:11:53 +11:00
# include "common/system.h"
2015-10-23 14:17:34 +11:00
# include "common/common.h"
2015-11-11 15:41:10 +11:00
# include "common/logging.h"
2016-09-22 14:35:03 +10:00
# include "common/pidfile.h"
2017-01-30 14:34:12 +11:00
# include "common/sock_io.h"
2007-04-10 06:03:39 +10:00
2009-12-02 13:41:04 +11:00
struct ctdb_client_pid_list {
struct ctdb_client_pid_list * next , * prev ;
struct ctdb_context * ctdb ;
pid_t pid ;
struct ctdb_client * client ;
} ;
2013-04-15 13:32:57 +10:00
const char * ctdbd_pidfile = NULL ;
2016-09-22 14:35:03 +10:00
static struct pidfile_context * ctdbd_pidfile_ctx = NULL ;
2013-04-15 13:32:57 +10:00
2007-05-19 13:45:24 +10:00
static void daemon_incoming_packet ( void * , struct ctdb_req_header * ) ;
2007-04-19 16:27:56 +10:00
2016-11-25 14:54:07 +11:00
static pid_t __ctdbd_pid ;
2007-09-24 10:00:14 +10:00
static void print_exit_message ( void )
{
2016-11-25 14:54:07 +11:00
if ( getpid ( ) = = __ctdbd_pid ) {
2013-01-10 14:39:09 +11:00
DEBUG ( DEBUG_NOTICE , ( " CTDB daemon shutting down \n " ) ) ;
2013-07-17 11:14:37 +10:00
/* Wait a second to allow pending log messages to be flushed */
sleep ( 1 ) ;
2013-01-10 14:39:09 +11:00
}
2007-09-24 10:00:14 +10:00
}
2019-01-18 17:46:37 +11:00
# ifdef HAVE_GETRUSAGE
2011-01-14 09:46:04 +11:00
2019-01-18 17:46:37 +11:00
struct cpu_check_threshold_data {
unsigned short percent ;
struct timeval timeofday ;
struct timeval ru_time ;
} ;
static void ctdb_cpu_check_threshold ( struct tevent_context * ev ,
struct tevent_timer * te ,
struct timeval tv ,
void * private_data )
{
struct ctdb_context * ctdb = talloc_get_type_abort (
private_data , struct ctdb_context ) ;
uint32_t interval = 60 ;
static unsigned short threshold = 0 ;
static struct cpu_check_threshold_data prev = {
. percent = 0 ,
. timeofday = { . tv_sec = 0 } ,
. ru_time = { . tv_sec = 0 } ,
} ;
struct rusage usage ;
struct cpu_check_threshold_data curr = {
. percent = 0 ,
} ;
int64_t ru_time_diff , timeofday_diff ;
bool first ;
int ret ;
/*
* Cache the threshold so that we don ' t waste time checking
* the environment variable every time
*/
if ( threshold = = 0 ) {
const char * t ;
threshold = 90 ;
t = getenv ( " CTDB_TEST_CPU_USAGE_THRESHOLD " ) ;
if ( t ! = NULL ) {
int th ;
th = atoi ( t ) ;
if ( th < = 0 | | th > 100 ) {
DBG_WARNING ( " Failed to parse env var: %s \n " , t ) ;
} else {
threshold = th ;
}
}
}
ret = getrusage ( RUSAGE_SELF , & usage ) ;
if ( ret ! = 0 ) {
DBG_WARNING ( " rusage() failed: %d \n " , ret ) ;
goto next ;
}
/* Sum the system and user CPU usage */
curr . ru_time = timeval_sum ( & usage . ru_utime , & usage . ru_stime ) ;
curr . timeofday = tv ;
first = timeval_is_zero ( & prev . timeofday ) ;
if ( first ) {
/* No previous values recorded so no calculation to do */
goto done ;
}
timeofday_diff = usec_time_diff ( & curr . timeofday , & prev . timeofday ) ;
if ( timeofday_diff < = 0 ) {
/*
* Time went backwards or didn ' t progress so no ( sane )
* calculation can be done
*/
goto done ;
}
ru_time_diff = usec_time_diff ( & curr . ru_time , & prev . ru_time ) ;
curr . percent = ru_time_diff * 100 / timeofday_diff ;
if ( curr . percent > = threshold ) {
/* Log only if the utilisation changes */
if ( curr . percent ! = prev . percent ) {
D_WARNING ( " WARNING: CPU utilisation %hu%% >= "
" threshold (%hu%%) \n " ,
curr . percent ,
threshold ) ;
}
} else {
/* Log if the utilisation falls below the threshold */
if ( prev . percent > = threshold ) {
D_WARNING ( " WARNING: CPU utilisation %hu%% < "
" threshold (%hu%%) \n " ,
curr . percent ,
threshold ) ;
}
}
done :
prev = curr ;
next :
tevent_add_timer ( ctdb - > ev , ctdb ,
timeval_current_ofs ( interval , 0 ) ,
ctdb_cpu_check_threshold ,
ctdb ) ;
}
static void ctdb_start_cpu_check_threshold ( struct ctdb_context * ctdb )
{
tevent_add_timer ( ctdb - > ev , ctdb ,
timeval_current ( ) ,
ctdb_cpu_check_threshold ,
ctdb ) ;
}
# endif /* HAVE_GETRUSAGE */
2011-01-14 09:46:04 +11:00
2015-10-26 16:50:09 +11:00
static void ctdb_time_tick ( struct tevent_context * ev , struct tevent_timer * te ,
2011-01-14 09:46:04 +11:00
struct timeval t , void * private_data )
{
struct ctdb_context * ctdb = talloc_get_type ( private_data , struct ctdb_context ) ;
2014-07-03 12:29:46 +10:00
if ( getpid ( ) ! = ctdb - > ctdbd_pid ) {
2011-01-14 09:46:04 +11:00
return ;
}
2015-10-26 16:50:09 +11:00
tevent_add_timer ( ctdb - > ev , ctdb ,
timeval_current_ofs ( 1 , 0 ) ,
ctdb_time_tick , ctdb ) ;
2011-01-14 09:46:04 +11:00
}
/* Used to trigger a dummy event once per second, to make
* detection of hangs more reliable .
*/
static void ctdb_start_time_tickd ( struct ctdb_context * ctdb )
{
2015-10-26 16:50:09 +11:00
tevent_add_timer ( ctdb - > ev , ctdb ,
timeval_current_ofs ( 1 , 0 ) ,
ctdb_time_tick , ctdb ) ;
2011-01-14 09:46:04 +11:00
}
2013-01-10 16:33:36 +11:00
static void ctdb_start_periodic_events ( struct ctdb_context * ctdb )
2007-05-30 13:26:50 +10:00
{
2008-01-15 08:42:12 +11:00
/* start monitoring for connected/disconnected nodes */
ctdb_start_keepalive ( ctdb ) ;
2007-07-20 15:05:55 +10:00
/* start periodic update of tcp tickle lists */
ctdb_start_tcp_tickle_update ( ctdb ) ;
2008-09-09 13:44:46 +10:00
/* start listening for recovery daemon pings */
ctdb_control_recd_ping ( ctdb ) ;
2011-01-14 09:46:04 +11:00
/* start listening to timer ticks */
ctdb_start_time_tickd ( ctdb ) ;
2019-01-18 17:46:37 +11:00
# ifdef HAVE_GETRUSAGE
ctdb_start_cpu_check_threshold ( ctdb ) ;
# endif /* HAVE_GETRUSAGE */
2007-05-30 13:26:50 +10:00
}
2014-06-06 14:58:17 +10:00
static void ignore_signal ( int signum )
2007-04-17 15:33:20 +10:00
{
struct sigaction act ;
memset ( & act , 0 , sizeof ( act ) ) ;
act . sa_handler = SIG_IGN ;
sigemptyset ( & act . sa_mask ) ;
sigaddset ( & act . sa_mask , signum ) ;
sigaction ( signum , & act , NULL ) ;
}
2007-04-10 06:03:39 +10:00
2007-04-20 20:07:47 +10:00
/*
send a packet to a client
*/
static int daemon_queue_send ( struct ctdb_client * client , struct ctdb_req_header * hdr )
{
2010-09-29 10:38:41 +10:00
CTDB_INCREMENT_STAT ( client - > ctdb , client_packets_sent ) ;
2009-10-21 15:20:55 +11:00
if ( hdr - > operation = = CTDB_REQ_MESSAGE ) {
if ( ctdb_queue_length ( client - > queue ) > client - > ctdb - > tunable . max_queue_depth_drop_msg ) {
2010-02-04 14:36:14 +11:00
DEBUG ( DEBUG_ERR , ( " CTDB_REQ_MESSAGE queue full - killing client connection. \n " ) ) ;
talloc_free ( client ) ;
return - 1 ;
2009-10-21 15:20:55 +11:00
}
}
2007-04-20 20:07:47 +10:00
return ctdb_queue_send ( client - > queue , ( uint8_t * ) hdr , hdr - > length ) ;
}
2007-04-11 11:58:28 +10:00
/*
message handler for when we are in daemon mode . This redirects the message
to the right client
*/
2015-04-08 14:38:26 +10:00
static void daemon_message_handler ( uint64_t srvid , TDB_DATA data ,
void * private_data )
2007-04-11 11:58:28 +10:00
{
2007-04-13 20:38:24 +10:00
struct ctdb_client * client = talloc_get_type ( private_data , struct ctdb_client ) ;
2015-10-29 16:36:30 +11:00
struct ctdb_req_message_old * r ;
2007-04-11 11:58:28 +10:00
int len ;
/* construct a message to send to the client containing the data */
2015-10-29 16:36:30 +11:00
len = offsetof ( struct ctdb_req_message_old , data ) + data . dsize ;
2015-04-08 14:38:26 +10:00
r = ctdbd_allocate_pkt ( client - > ctdb , client - > ctdb , CTDB_REQ_MESSAGE ,
2015-10-29 16:36:30 +11:00
len , struct ctdb_req_message_old ) ;
2015-04-08 14:38:26 +10:00
CTDB_NO_MEMORY_VOID ( client - > ctdb , r ) ;
2007-04-11 13:43:15 +10:00
2007-04-11 11:58:28 +10:00
talloc_set_name_const ( r , " req_message packet " ) ;
r - > srvid = srvid ;
r - > datalen = data . dsize ;
memcpy ( & r - > data [ 0 ] , data . dptr , data . dsize ) ;
2007-04-17 10:15:44 +10:00
2007-04-20 20:07:47 +10:00
daemon_queue_send ( client , & r - > hdr ) ;
2007-04-11 11:58:28 +10:00
talloc_free ( r ) ;
}
/*
2023-03-22 09:36:23 +01:00
this is called when the ctdb daemon received a ctdb request to
2007-04-11 11:58:28 +10:00
set the srvid from the client
*/
2007-05-04 11:41:29 +10:00
int daemon_register_message_handler ( struct ctdb_context * ctdb , uint32_t client_id , uint64_t srvid )
2007-04-11 11:58:28 +10:00
{
2015-03-17 14:30:18 +11:00
struct ctdb_client * client = reqid_find ( ctdb - > idr , client_id , struct ctdb_client ) ;
2007-04-11 11:58:28 +10:00
int res ;
2007-05-04 11:41:29 +10:00
if ( client = = NULL ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( " Bad client_id in daemon_request_register_message_handler \n " ) ) ;
2007-05-04 11:41:29 +10:00
return - 1 ;
}
2015-04-08 14:38:26 +10:00
res = srvid_register ( ctdb - > srv , client , srvid , daemon_message_handler ,
client ) ;
2007-04-11 11:58:28 +10:00
if ( res ! = 0 ) {
2023-03-22 09:36:23 +01:00
DEBUG ( DEBUG_ERR , ( __location__ " Failed to register handler %llu in daemon \n " ,
2007-05-29 13:58:41 +10:00
( unsigned long long ) srvid ) ) ;
2007-04-20 07:47:37 +10:00
} else {
2023-03-22 09:36:23 +01:00
DEBUG ( DEBUG_INFO , ( __location__ " Registered message handler for srvid=%llu \n " ,
2007-05-29 13:58:41 +10:00
( unsigned long long ) srvid ) ) ;
2007-04-11 11:58:28 +10:00
}
2007-06-19 03:54:06 +10:00
2007-05-04 11:41:29 +10:00
return res ;
}
/*
2023-03-22 09:36:23 +01:00
this is called when the ctdb daemon received a ctdb request to
2007-05-04 11:41:29 +10:00
remove a srvid from the client
*/
int daemon_deregister_message_handler ( struct ctdb_context * ctdb , uint32_t client_id , uint64_t srvid )
{
2015-03-17 14:30:18 +11:00
struct ctdb_client * client = reqid_find ( ctdb - > idr , client_id , struct ctdb_client ) ;
2007-05-04 11:41:29 +10:00
if ( client = = NULL ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( " Bad client_id in daemon_request_deregister_message_handler \n " ) ) ;
2007-05-04 11:41:29 +10:00
return - 1 ;
}
2015-04-08 14:38:26 +10:00
return srvid_deregister ( ctdb - > srv , srvid , client ) ;
2007-04-11 11:58:28 +10:00
}
2017-04-06 19:03:51 +10:00
void daemon_tunnel_handler ( uint64_t tunnel_id , TDB_DATA data ,
void * private_data )
{
struct ctdb_client * client =
talloc_get_type_abort ( private_data , struct ctdb_client ) ;
struct ctdb_req_tunnel_old * c , * pkt ;
size_t len ;
pkt = ( struct ctdb_req_tunnel_old * ) data . dptr ;
len = offsetof ( struct ctdb_req_tunnel_old , data ) + pkt - > datalen ;
c = ctdbd_allocate_pkt ( client - > ctdb , client - > ctdb , CTDB_REQ_TUNNEL ,
len , struct ctdb_req_tunnel_old ) ;
if ( c = = NULL ) {
DEBUG ( DEBUG_ERR , ( " Memory error in daemon_tunnel_handler \n " ) ) ;
return ;
}
talloc_set_name_const ( c , " req_tunnel packet " ) ;
c - > tunnel_id = tunnel_id ;
c - > flags = pkt - > flags ;
c - > datalen = pkt - > datalen ;
memcpy ( c - > data , pkt - > data , pkt - > datalen ) ;
daemon_queue_send ( client , & c - > hdr ) ;
talloc_free ( c ) ;
}
2007-04-10 06:03:39 +10:00
/*
destroy a ctdb_client
*/
static int ctdb_client_destructor ( struct ctdb_client * client )
{
2009-07-21 11:30:38 +02:00
struct ctdb_db_context * ctdb_db ;
2007-05-27 15:26:29 +10:00
ctdb_takeover_client_destructor_hook ( client ) ;
2015-03-17 14:30:18 +11:00
reqid_remove ( client - > ctdb - > idr , client - > client_id ) ;
2013-04-19 13:29:04 +10:00
client - > ctdb - > num_clients - - ;
2008-07-17 13:50:55 +10:00
if ( client - > num_persistent_updates ! = 0 ) {
DEBUG ( DEBUG_ERR , ( __location__ " Client disconnecting with %u persistent updates in flight. Starting recovery \n " , client - > num_persistent_updates ) ) ;
client - > ctdb - > recovery_mode = CTDB_RECOVERY_ACTIVE ;
}
2009-07-21 11:30:38 +02:00
ctdb_db = find_ctdb_db ( client - > ctdb , client - > db_id ) ;
if ( ctdb_db ) {
DEBUG ( DEBUG_ERR , ( __location__ " client exit while transaction "
" commit active. Forcing recovery. \n " ) ) ;
client - > ctdb - > recovery_mode = CTDB_RECOVERY_ACTIVE ;
2011-02-23 17:37:42 +01:00
/*
* trans3 transaction state :
*
* The destructor sets the pointer to NULL .
*/
talloc_free ( ctdb_db - > persistent_state ) ;
2009-07-21 11:30:38 +02:00
}
2008-07-17 13:50:55 +10:00
2007-04-10 06:03:39 +10:00
return 0 ;
}
2007-04-11 13:43:15 +10:00
/*
this is called when the ctdb daemon received a ctdb request message
from a local client over the unix domain socket
*/
2023-03-22 09:36:23 +01:00
static void daemon_request_message_from_client ( struct ctdb_client * client ,
2015-10-29 16:36:30 +11:00
struct ctdb_req_message_old * c )
2007-04-11 13:43:15 +10:00
{
2007-04-11 14:05:01 +10:00
TDB_DATA data ;
int res ;
2012-02-13 13:24:37 +01:00
if ( c - > hdr . destnode = = CTDB_CURRENT_NODE ) {
c - > hdr . destnode = ctdb_get_pnn ( client - > ctdb ) ;
}
2007-04-11 14:05:01 +10:00
/* maybe the message is for another client on this node */
2007-09-04 10:18:44 +10:00
if ( ctdb_get_pnn ( client - > ctdb ) = = c - > hdr . destnode ) {
2007-04-11 13:43:15 +10:00
ctdb_request_message ( client - > ctdb , ( struct ctdb_req_header * ) c ) ;
2007-04-11 14:05:01 +10:00
return ;
}
2007-04-27 23:16:17 +10:00
2007-04-11 14:05:01 +10:00
/* its for a remote node */
data . dptr = & c - > data [ 0 ] ;
data . dsize = c - > datalen ;
res = ctdb_daemon_send_message ( client - > ctdb , c - > hdr . destnode ,
c - > srvid , data ) ;
if ( res ! = 0 ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Failed to send message to remote node %u \n " ,
2007-04-17 22:27:17 +10:00
c - > hdr . destnode ) ) ;
2007-04-11 13:43:15 +10:00
}
}
2007-04-19 10:37:44 +10:00
struct daemon_call_state {
struct ctdb_client * client ;
uint32_t reqid ;
struct ctdb_call * call ;
2007-04-20 20:07:47 +10:00
struct timeval start_time ;
2012-01-31 17:20:35 +11:00
/* readonly request ? */
uint32_t readonly_fetch ;
uint32_t client_callid ;
2007-04-19 10:37:44 +10:00
} ;
2023-03-22 09:36:23 +01:00
/*
complete a call from a client
2007-04-19 10:37:44 +10:00
*/
static void daemon_call_from_client_callback ( struct ctdb_call_state * state )
2007-04-10 06:03:39 +10:00
{
2023-03-22 09:36:23 +01:00
struct daemon_call_state * dstate = talloc_get_type ( state - > async . private_data ,
2007-04-19 10:37:44 +10:00
struct daemon_call_state ) ;
2015-10-29 16:29:01 +11:00
struct ctdb_reply_call_old * r ;
2007-04-10 06:03:39 +10:00
int res ;
2007-04-11 11:01:42 +10:00
uint32_t length ;
2007-04-19 10:37:44 +10:00
struct ctdb_client * client = dstate - > client ;
2008-11-03 21:54:52 +11:00
struct ctdb_db_context * ctdb_db = state - > ctdb_db ;
2007-04-10 06:03:39 +10:00
2007-04-19 10:37:44 +10:00
talloc_steal ( client , dstate ) ;
talloc_steal ( dstate , dstate - > call ) ;
2007-04-10 06:03:39 +10:00
2007-04-19 10:37:44 +10:00
res = ctdb_daemon_call_recv ( state , dstate - > call ) ;
2007-04-10 06:03:39 +10:00
if ( res ! = 0 ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " ctdbd_call_recv() returned error \n " ) ) ;
2010-09-29 10:38:41 +10:00
CTDB_DECREMENT_STAT ( client - > ctdb , pending_calls ) ;
2010-10-11 15:11:18 +11:00
CTDB_UPDATE_LATENCY ( client - > ctdb , ctdb_db , " call_from_client_cb 1 " , call_latency , dstate - > start_time ) ;
2007-04-19 10:37:44 +10:00
return ;
2007-04-10 06:03:39 +10:00
}
2015-10-29 16:29:01 +11:00
length = offsetof ( struct ctdb_reply_call_old , data ) + dstate - > call - > reply_data . dsize ;
2023-03-22 09:36:23 +01:00
/* If the client asked for readonly FETCH, we remapped this to
2012-01-31 17:20:35 +11:00
FETCH_WITH_HEADER when calling the daemon . So we must
strip the extra header off the reply data before passing
it back to the client .
*/
if ( dstate - > readonly_fetch
& & dstate - > client_callid = = CTDB_FETCH_FUNC ) {
length - = sizeof ( struct ctdb_ltdb_header ) ;
}
2023-03-22 09:36:23 +01:00
r = ctdbd_allocate_pkt ( client - > ctdb , dstate , CTDB_REPLY_CALL ,
2015-10-29 16:29:01 +11:00
length , struct ctdb_reply_call_old ) ;
2007-04-11 11:01:42 +10:00
if ( r = = NULL ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Failed to allocate reply_call in ctdb daemon \n " ) ) ;
2010-09-29 10:38:41 +10:00
CTDB_DECREMENT_STAT ( client - > ctdb , pending_calls ) ;
2010-10-11 15:11:18 +11:00
CTDB_UPDATE_LATENCY ( client - > ctdb , ctdb_db , " call_from_client_cb 2 " , call_latency , dstate - > start_time ) ;
2007-04-11 11:01:42 +10:00
return ;
}
2007-04-19 10:37:44 +10:00
r - > hdr . reqid = dstate - > reqid ;
2011-07-20 15:17:29 +10:00
r - > status = dstate - > call - > status ;
2012-01-31 17:20:35 +11:00
if ( dstate - > readonly_fetch
& & dstate - > client_callid = = CTDB_FETCH_FUNC ) {
/* client only asked for a FETCH so we must strip off
the extra ctdb_ltdb header
*/
r - > datalen = dstate - > call - > reply_data . dsize - sizeof ( struct ctdb_ltdb_header ) ;
memcpy ( & r - > data [ 0 ] , dstate - > call - > reply_data . dptr + sizeof ( struct ctdb_ltdb_header ) , r - > datalen ) ;
} else {
r - > datalen = dstate - > call - > reply_data . dsize ;
memcpy ( & r - > data [ 0 ] , dstate - > call - > reply_data . dptr , r - > datalen ) ;
}
2007-04-11 11:01:42 +10:00
2007-04-20 20:07:47 +10:00
res = daemon_queue_send ( client , & r - > hdr ) ;
2010-02-04 14:36:14 +11:00
if ( res = = - 1 ) {
/* client is dead - return immediately */
return ;
}
2007-04-11 11:01:42 +10:00
if ( res ! = 0 ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Failed to queue packet from daemon to client \n " ) ) ;
2007-04-10 06:03:39 +10:00
}
2010-10-11 15:11:18 +11:00
CTDB_UPDATE_LATENCY ( client - > ctdb , ctdb_db , " call_from_client_cb 3 " , call_latency , dstate - > start_time ) ;
2010-09-29 10:38:41 +10:00
CTDB_DECREMENT_STAT ( client - > ctdb , pending_calls ) ;
2007-04-19 10:37:44 +10:00
talloc_free ( dstate ) ;
2007-04-10 06:03:39 +10:00
}
2008-01-16 09:44:48 +11:00
struct ctdb_daemon_packet_wrap {
struct ctdb_context * ctdb ;
uint32_t client_id ;
} ;
/*
a wrapper to catch disconnected clients
*/
static void daemon_incoming_packet_wrap ( void * p , struct ctdb_req_header * hdr )
{
struct ctdb_client * client ;
2023-03-22 09:36:23 +01:00
struct ctdb_daemon_packet_wrap * w = talloc_get_type ( p ,
2008-01-16 09:44:48 +11:00
struct ctdb_daemon_packet_wrap ) ;
if ( w = = NULL ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_CRIT , ( __location__ " Bad packet type '%s' \n " , talloc_get_name ( p ) ) ) ;
2008-01-16 09:44:48 +11:00
return ;
}
2015-03-17 14:30:18 +11:00
client = reqid_find ( w - > ctdb - > idr , w - > client_id , struct ctdb_client ) ;
2008-01-16 09:44:48 +11:00
if ( client = = NULL ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Packet for disconnected client %u \n " ,
2008-01-16 09:44:48 +11:00
w - > client_id ) ) ;
talloc_free ( w ) ;
return ;
}
talloc_free ( w ) ;
/* process it */
2023-03-22 09:36:23 +01:00
daemon_incoming_packet ( client , hdr ) ;
2008-01-16 09:44:48 +11:00
}
2007-04-19 16:27:56 +10:00
2011-11-08 06:55:46 +11:00
struct ctdb_deferred_fetch_call {
struct ctdb_deferred_fetch_call * next , * prev ;
2015-10-29 16:26:29 +11:00
struct ctdb_req_call_old * c ;
2011-11-08 06:55:46 +11:00
struct ctdb_daemon_packet_wrap * w ;
} ;
struct ctdb_deferred_fetch_queue {
struct ctdb_deferred_fetch_call * deferred_calls ;
} ;
struct ctdb_deferred_requeue {
struct ctdb_deferred_fetch_call * dfc ;
struct ctdb_client * client ;
} ;
/* called from a timer event and starts reprocessing the deferred call.*/
2015-10-26 16:50:09 +11:00
static void reprocess_deferred_call ( struct tevent_context * ev ,
struct tevent_timer * te ,
struct timeval t , void * private_data )
2011-11-08 06:55:46 +11:00
{
struct ctdb_deferred_requeue * dfr = ( struct ctdb_deferred_requeue * ) private_data ;
struct ctdb_client * client = dfr - > client ;
talloc_steal ( client , dfr - > dfc - > c ) ;
daemon_incoming_packet ( client , ( struct ctdb_req_header * ) dfr - > dfc - > c ) ;
talloc_free ( dfr ) ;
}
/* the referral context is destroyed either after a timeout or when the initial
fetch - lock has finished .
at this stage , immediately start reprocessing the queued up deferred
calls so they get reprocessed immediately ( and since we are dmaster at
2019-10-26 02:41:09 +02:00
this stage , trigger the waiting smbd processes to pick up and acquire the
2011-11-08 06:55:46 +11:00
record right away .
*/
static int deferred_fetch_queue_destructor ( struct ctdb_deferred_fetch_queue * dfq )
{
2019-10-26 02:41:09 +02:00
/* need to reprocess the packets from the queue explicitly instead of
just using a normal destructor since we need to
call the clients in the same order as the requests queued up
2011-11-08 06:55:46 +11:00
*/
while ( dfq - > deferred_calls ! = NULL ) {
struct ctdb_client * client ;
struct ctdb_deferred_fetch_call * dfc = dfq - > deferred_calls ;
struct ctdb_deferred_requeue * dfr ;
DLIST_REMOVE ( dfq - > deferred_calls , dfc ) ;
2015-03-17 14:30:18 +11:00
client = reqid_find ( dfc - > w - > ctdb - > idr , dfc - > w - > client_id , struct ctdb_client ) ;
2011-11-08 06:55:46 +11:00
if ( client = = NULL ) {
DEBUG ( DEBUG_ERR , ( __location__ " Packet for disconnected client %u \n " ,
dfc - > w - > client_id ) ) ;
continue ;
}
/* process it by pushing it back onto the eventloop */
dfr = talloc ( client , struct ctdb_deferred_requeue ) ;
if ( dfr = = NULL ) {
DEBUG ( DEBUG_ERR , ( " Failed to allocate deferred fetch requeue structure \n " ) ) ;
continue ;
}
dfr - > dfc = talloc_steal ( dfr , dfc ) ;
dfr - > client = client ;
2015-10-26 16:50:09 +11:00
tevent_add_timer ( dfc - > w - > ctdb - > ev , client , timeval_zero ( ) ,
reprocess_deferred_call , dfr ) ;
2011-11-08 06:55:46 +11:00
}
return 0 ;
}
/* insert the new deferral context into the rb tree.
there should never be a pre - existing context here , but check for it
warn and destroy the previous context if there is already a deferral context
for this key .
*/
static void * insert_dfq_callback ( void * parm , void * data )
{
if ( data ) {
DEBUG ( DEBUG_ERR , ( " Already have DFQ registered. Free old %p and create new %p \n " , data , parm ) ) ;
talloc_free ( data ) ;
}
return parm ;
}
/* if the original fetch-lock did not complete within a reasonable time,
free the context and context for all deferred requests to cause them to be
re - inserted into the event system .
*/
2015-10-26 16:50:09 +11:00
static void dfq_timeout ( struct tevent_context * ev , struct tevent_timer * te ,
struct timeval t , void * private_data )
2011-11-08 06:55:46 +11:00
{
talloc_free ( private_data ) ;
}
/* This function is used in the local daemon to register a KEY in a database
for being " fetched "
2023-03-22 09:36:23 +01:00
While the remote fetch is in - flight , any further attempts to re - fetch the
2011-11-08 06:55:46 +11:00
same record will be deferred until the fetch completes .
*/
static int setup_deferred_fetch_locks ( struct ctdb_db_context * ctdb_db , struct ctdb_call * call )
{
uint32_t * k ;
struct ctdb_deferred_fetch_queue * dfq ;
2014-08-15 13:33:24 +10:00
k = ctdb_key_to_idkey ( call , call - > key ) ;
2011-11-08 06:55:46 +11:00
if ( k = = NULL ) {
DEBUG ( DEBUG_ERR , ( " Failed to allocate key for deferred fetch \n " ) ) ;
return - 1 ;
}
dfq = talloc ( call , struct ctdb_deferred_fetch_queue ) ;
if ( dfq = = NULL ) {
DEBUG ( DEBUG_ERR , ( " Failed to allocate key for deferred fetch queue structure \n " ) ) ;
talloc_free ( k ) ;
return - 1 ;
}
dfq - > deferred_calls = NULL ;
trbt_insertarray32_callback ( ctdb_db - > deferred_fetch , k [ 0 ] , & k [ 0 ] , insert_dfq_callback , dfq ) ;
talloc_set_destructor ( dfq , deferred_fetch_queue_destructor ) ;
2023-03-22 09:36:23 +01:00
/* If the fetch hasn't completed in 30 seconds, just tear it all down
2011-11-08 06:55:46 +11:00
and let it try again as the events are reissued */
2015-10-26 16:50:09 +11:00
tevent_add_timer ( ctdb_db - > ctdb - > ev , dfq , timeval_current_ofs ( 30 , 0 ) ,
dfq_timeout , dfq ) ;
2011-11-08 06:55:46 +11:00
talloc_free ( k ) ;
return 0 ;
}
/* check if this is a duplicate request to a fetch already in-flight
if it is , make this call deferred to be reprocessed later when
the in - flight fetch completes .
*/
2015-10-29 16:26:29 +11:00
static int requeue_duplicate_fetch ( struct ctdb_db_context * ctdb_db , struct ctdb_client * client , TDB_DATA key , struct ctdb_req_call_old * c )
2011-11-08 06:55:46 +11:00
{
uint32_t * k ;
struct ctdb_deferred_fetch_queue * dfq ;
struct ctdb_deferred_fetch_call * dfc ;
2014-08-15 13:33:24 +10:00
k = ctdb_key_to_idkey ( c , key ) ;
2011-11-08 06:55:46 +11:00
if ( k = = NULL ) {
DEBUG ( DEBUG_ERR , ( " Failed to allocate key for deferred fetch \n " ) ) ;
return - 1 ;
}
dfq = trbt_lookuparray32 ( ctdb_db - > deferred_fetch , k [ 0 ] , & k [ 0 ] ) ;
if ( dfq = = NULL ) {
talloc_free ( k ) ;
return - 1 ;
}
talloc_free ( k ) ;
dfc = talloc ( dfq , struct ctdb_deferred_fetch_call ) ;
if ( dfc = = NULL ) {
DEBUG ( DEBUG_ERR , ( " Failed to allocate deferred fetch call structure \n " ) ) ;
return - 1 ;
}
dfc - > w = talloc ( dfc , struct ctdb_daemon_packet_wrap ) ;
if ( dfc - > w = = NULL ) {
DEBUG ( DEBUG_ERR , ( " Failed to allocate deferred fetch daemon packet wrap structure \n " ) ) ;
talloc_free ( dfc ) ;
return - 1 ;
}
dfc - > c = talloc_steal ( dfc , c ) ;
dfc - > w - > ctdb = ctdb_db - > ctdb ;
dfc - > w - > client_id = client - > client_id ;
2016-02-05 11:32:18 +01:00
DLIST_ADD_END ( dfq - > deferred_calls , dfc ) ;
2011-11-08 06:55:46 +11:00
return 0 ;
}
2007-05-10 07:43:18 +10:00
2007-04-19 10:37:44 +10:00
/*
this is called when the ctdb daemon received a ctdb request call
from a local client over the unix domain socket
*/
2023-03-22 09:36:23 +01:00
static void daemon_request_call_from_client ( struct ctdb_client * client ,
2015-10-29 16:26:29 +11:00
struct ctdb_req_call_old * c )
2007-04-19 10:37:44 +10:00
{
struct ctdb_call_state * state ;
struct ctdb_db_context * ctdb_db ;
struct daemon_call_state * dstate ;
struct ctdb_call * call ;
2007-04-19 16:27:56 +10:00
struct ctdb_ltdb_header header ;
TDB_DATA key , data ;
int ret ;
struct ctdb_context * ctdb = client - > ctdb ;
2008-01-16 09:44:48 +11:00
struct ctdb_daemon_packet_wrap * w ;
2007-04-19 10:37:44 +10:00
2010-09-29 10:38:41 +10:00
CTDB_INCREMENT_STAT ( ctdb , total_calls ) ;
2014-09-09 19:01:55 +10:00
CTDB_INCREMENT_STAT ( ctdb , pending_calls ) ;
2007-04-20 20:07:47 +10:00
2007-04-19 10:37:44 +10:00
ctdb_db = find_ctdb_db ( client - > ctdb , c - > db_id ) ;
if ( ! ctdb_db ) {
2023-08-07 16:32:34 +12:00
DEBUG ( DEBUG_ERR , ( __location__ " Unknown database in request. db_id==0x%08x \n " ,
2007-04-19 10:37:44 +10:00
c - > db_id ) ) ;
2010-09-29 10:38:41 +10:00
CTDB_DECREMENT_STAT ( ctdb , pending_calls ) ;
2007-04-19 10:37:44 +10:00
return ;
}
2009-12-07 13:28:11 +01:00
if ( ctdb_db - > unhealthy_reason ) {
/*
* this is just a warning , as the tdb should be empty anyway ,
* and only persistent databases can be unhealthy , which doesn ' t
* use this code patch
*/
DEBUG ( DEBUG_WARNING , ( " warn: db(%s) unhealty in daemon_request_call_from_client(): %s \n " ,
ctdb_db - > db_name , ctdb_db - > unhealthy_reason ) ) ;
}
2007-04-19 16:27:56 +10:00
key . dptr = c - > data ;
key . dsize = c - > keylen ;
2008-01-16 09:44:48 +11:00
w = talloc ( ctdb , struct ctdb_daemon_packet_wrap ) ;
2023-03-22 09:36:23 +01:00
CTDB_NO_MEMORY_VOID ( ctdb , w ) ;
2008-01-16 09:44:48 +11:00
w - > ctdb = ctdb ;
w - > client_id = client - > client_id ;
2023-03-22 09:36:23 +01:00
ret = ctdb_ltdb_lock_fetch_requeue ( ctdb_db , key , & header ,
2007-04-19 16:27:56 +10:00
( struct ctdb_req_header * ) c , & data ,
2012-05-17 16:08:37 +10:00
daemon_incoming_packet_wrap , w , true ) ;
2007-04-19 16:27:56 +10:00
if ( ret = = - 2 ) {
/* will retry later */
2010-09-29 10:38:41 +10:00
CTDB_DECREMENT_STAT ( ctdb , pending_calls ) ;
2007-04-19 16:27:56 +10:00
return ;
}
2008-01-16 09:44:48 +11:00
talloc_free ( w ) ;
2007-04-19 16:27:56 +10:00
if ( ret ! = 0 ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Unable to fetch record \n " ) ) ;
2010-09-29 10:38:41 +10:00
CTDB_DECREMENT_STAT ( ctdb , pending_calls ) ;
2007-04-19 16:27:56 +10:00
return ;
}
2012-03-20 11:31:59 +11:00
/* check if this fetch request is a duplicate for a
request we already have in flight . If so defer it until
the first request completes .
*/
if ( ctdb - > tunable . fetch_collapse = = 1 ) {
2011-11-08 06:55:46 +11:00
if ( requeue_duplicate_fetch ( ctdb_db , client , key , c ) = = 0 ) {
ret = ctdb_ltdb_unlock ( ctdb_db , key ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR , ( __location__ " ctdb_ltdb_unlock() failed with error %d \n " , ret ) ) ;
}
2014-09-12 10:50:27 +10:00
CTDB_DECREMENT_STAT ( ctdb , pending_calls ) ;
2017-09-11 15:59:19 +10:00
talloc_free ( data . dptr ) ;
2011-11-08 06:55:46 +11:00
return ;
}
}
2015-07-26 23:02:57 +02:00
/* Dont do READONLY if we don't have a tracking database */
2017-03-02 15:44:48 +11:00
if ( ( c - > flags & CTDB_WANT_READONLY ) & & ! ctdb_db_readonly ( ctdb_db ) ) {
2011-07-20 15:17:29 +10:00
c - > flags & = ~ CTDB_WANT_READONLY ;
}
if ( header . flags & CTDB_REC_RO_REVOKE_COMPLETE ) {
2013-04-19 16:23:16 +02:00
header . flags & = ~ CTDB_REC_RO_FLAGS ;
2012-02-08 13:42:30 +11:00
CTDB_INCREMENT_STAT ( ctdb , total_ro_revokes ) ;
2012-02-08 15:29:27 +11:00
CTDB_INCREMENT_DB_STAT ( ctdb_db , db_ro_revokes ) ;
2011-07-20 15:17:29 +10:00
if ( ctdb_ltdb_store ( ctdb_db , key , & header , data ) ! = 0 ) {
ctdb_fatal ( ctdb , " Failed to write header with cleared REVOKE flag " ) ;
}
2011-08-17 16:14:57 +10:00
/* and clear out the tracking data */
if ( tdb_delete ( ctdb_db - > rottdb , key ) ! = 0 ) {
DEBUG ( DEBUG_ERR , ( __location__ " Failed to clear out trackingdb record \n " ) ) ;
}
2011-07-20 15:17:29 +10:00
}
/* if we are revoking, we must defer all other calls until the revoke
* had completed .
*/
if ( header . flags & CTDB_REC_RO_REVOKING_READONLY ) {
talloc_free ( data . dptr ) ;
ret = ctdb_ltdb_unlock ( ctdb_db , key ) ;
if ( ctdb_add_revoke_deferred_call ( ctdb , ctdb_db , key , ( struct ctdb_req_header * ) c , daemon_incoming_packet , client ) ! = 0 ) {
ctdb_fatal ( ctdb , " Failed to add deferred call for revoke child " ) ;
}
2014-09-12 10:50:27 +10:00
CTDB_DECREMENT_STAT ( ctdb , pending_calls ) ;
2011-07-20 15:17:29 +10:00
return ;
}
if ( ( header . dmaster = = ctdb - > pnn )
& & ( ! ( c - > flags & CTDB_WANT_READONLY ) )
& & ( header . flags & ( CTDB_REC_RO_HAVE_DELEGATIONS | CTDB_REC_RO_HAVE_READONLY ) ) ) {
header . flags | = CTDB_REC_RO_REVOKING_READONLY ;
if ( ctdb_ltdb_store ( ctdb_db , key , & header , data ) ! = 0 ) {
ctdb_fatal ( ctdb , " Failed to store record with HAVE_DELEGATIONS set " ) ;
}
ret = ctdb_ltdb_unlock ( ctdb_db , key ) ;
if ( ctdb_start_revoke_ro_record ( ctdb , ctdb_db , key , & header , data ) ! = 0 ) {
ctdb_fatal ( ctdb , " Failed to start record revoke " ) ;
}
talloc_free ( data . dptr ) ;
if ( ctdb_add_revoke_deferred_call ( ctdb , ctdb_db , key , ( struct ctdb_req_header * ) c , daemon_incoming_packet , client ) ! = 0 ) {
ctdb_fatal ( ctdb , " Failed to add deferred call for revoke child " ) ;
}
2014-09-12 10:50:27 +10:00
CTDB_DECREMENT_STAT ( ctdb , pending_calls ) ;
2011-07-20 15:17:29 +10:00
return ;
2023-03-22 09:36:23 +01:00
}
2011-07-20 15:17:29 +10:00
2007-04-19 10:37:44 +10:00
dstate = talloc ( client , struct daemon_call_state ) ;
if ( dstate = = NULL ) {
2010-06-09 14:17:35 +10:00
ret = ctdb_ltdb_unlock ( ctdb_db , key ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR , ( __location__ " ctdb_ltdb_unlock() failed with error %d \n " , ret ) ) ;
}
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Unable to allocate dstate \n " ) ) ;
2010-09-29 10:38:41 +10:00
CTDB_DECREMENT_STAT ( ctdb , pending_calls ) ;
2007-04-19 10:37:44 +10:00
return ;
}
2007-04-20 20:07:47 +10:00
dstate - > start_time = timeval_current ( ) ;
2007-04-19 10:37:44 +10:00
dstate - > client = client ;
dstate - > reqid = c - > hdr . reqid ;
2007-04-19 16:27:56 +10:00
talloc_steal ( dstate , data . dptr ) ;
2007-04-19 10:37:44 +10:00
call = dstate - > call = talloc_zero ( dstate , struct ctdb_call ) ;
if ( call = = NULL ) {
2010-06-09 14:17:35 +10:00
ret = ctdb_ltdb_unlock ( ctdb_db , key ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR , ( __location__ " ctdb_ltdb_unlock() failed with error %d \n " , ret ) ) ;
}
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Unable to allocate call \n " ) ) ;
2010-09-29 10:38:41 +10:00
CTDB_DECREMENT_STAT ( ctdb , pending_calls ) ;
2010-10-11 15:11:18 +11:00
CTDB_UPDATE_LATENCY ( ctdb , ctdb_db , " call_from_client 1 " , call_latency , dstate - > start_time ) ;
2007-04-19 10:37:44 +10:00
return ;
}
2012-01-31 17:20:35 +11:00
dstate - > readonly_fetch = 0 ;
2007-04-19 10:37:44 +10:00
call - > call_id = c - > callid ;
2007-04-19 16:27:56 +10:00
call - > key = key ;
2007-04-19 10:37:44 +10:00
call - > call_data . dptr = c - > data + c - > keylen ;
call - > call_data . dsize = c - > calldatalen ;
2007-04-19 17:44:45 +02:00
call - > flags = c - > flags ;
2007-04-19 10:37:44 +10:00
2012-01-31 17:20:35 +11:00
if ( c - > flags & CTDB_WANT_READONLY ) {
2023-03-22 09:36:23 +01:00
/* client wants readonly record, so translate this into a
2012-01-31 17:20:35 +11:00
fetch with header . remember what the client asked for
so we can remap the reply back to the proper format for
the client in the reply
*/
dstate - > client_callid = call - > call_id ;
call - > call_id = CTDB_FETCH_WITH_HEADER_FUNC ;
dstate - > readonly_fetch = 1 ;
}
2007-09-04 10:06:36 +10:00
if ( header . dmaster = = ctdb - > pnn ) {
2007-04-19 16:27:56 +10:00
state = ctdb_call_local_send ( ctdb_db , call , & header , & data ) ;
} else {
state = ctdb_daemon_call_send_remote ( ctdb_db , call , & header ) ;
2012-03-20 11:31:59 +11:00
if ( ctdb - > tunable . fetch_collapse = = 1 ) {
2011-11-08 06:55:46 +11:00
/* This request triggered a remote fetch-lock.
set up a deferral for this key so any additional
fetch - locks are deferred until the current one
finishes .
*/
setup_deferred_fetch_locks ( ctdb_db , call ) ;
}
2007-04-19 16:27:56 +10:00
}
2010-06-09 14:17:35 +10:00
ret = ctdb_ltdb_unlock ( ctdb_db , key ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR , ( __location__ " ctdb_ltdb_unlock() failed with error %d \n " , ret ) ) ;
}
2007-04-19 16:27:56 +10:00
2007-04-19 10:37:44 +10:00
if ( state = = NULL ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Unable to setup call send \n " ) ) ;
2010-09-29 10:38:41 +10:00
CTDB_DECREMENT_STAT ( ctdb , pending_calls ) ;
2010-10-11 15:11:18 +11:00
CTDB_UPDATE_LATENCY ( ctdb , ctdb_db , " call_from_client 2 " , call_latency , dstate - > start_time ) ;
2007-04-19 10:37:44 +10:00
return ;
}
talloc_steal ( state , dstate ) ;
talloc_steal ( client , state ) ;
state - > async . fn = daemon_call_from_client_callback ;
state - > async . private_data = dstate ;
}
2007-04-10 06:03:39 +10:00
2007-04-26 14:27:49 +02:00
2023-03-22 09:36:23 +01:00
static void daemon_request_control_from_client ( struct ctdb_client * client ,
2015-10-29 16:42:05 +11:00
struct ctdb_req_control_old * c ) ;
2017-04-06 19:09:58 +10:00
static void daemon_request_tunnel_from_client ( struct ctdb_client * client ,
struct ctdb_req_tunnel_old * c ) ;
2007-04-26 14:27:49 +02:00
2007-04-10 06:03:39 +10:00
/* data contains a packet from the client */
2007-05-19 13:45:24 +10:00
static void daemon_incoming_packet ( void * p , struct ctdb_req_header * hdr )
2007-04-10 06:03:39 +10:00
{
2007-04-19 16:27:56 +10:00
struct ctdb_client * client = talloc_get_type ( p , struct ctdb_client ) ;
2007-04-18 11:20:24 +10:00
TALLOC_CTX * tmp_ctx ;
2007-04-20 21:02:53 +10:00
struct ctdb_context * ctdb = client - > ctdb ;
2007-04-18 11:20:24 +10:00
/* place the packet as a child of a tmp_ctx. We then use
talloc_free ( ) below to free it . If any of the calls want
to keep it , then they will steal it somewhere else , and the
talloc_free ( ) will be a no - op */
tmp_ctx = talloc_new ( client ) ;
talloc_steal ( tmp_ctx , hdr ) ;
2007-04-10 06:03:39 +10:00
if ( hdr - > ctdb_magic ! = CTDB_MAGIC ) {
2007-04-17 10:15:44 +10:00
ctdb_set_error ( client - > ctdb , " Non CTDB packet rejected in daemon \n " ) ;
2007-04-11 14:05:01 +10:00
goto done ;
2007-04-10 06:03:39 +10:00
}
2014-10-21 11:53:29 +11:00
if ( hdr - > ctdb_version ! = CTDB_PROTOCOL ) {
2007-04-17 10:15:44 +10:00
ctdb_set_error ( client - > ctdb , " Bad CTDB version 0x%x rejected in daemon \n " , hdr - > ctdb_version ) ;
2007-04-11 14:05:01 +10:00
goto done ;
2007-04-10 06:03:39 +10:00
}
switch ( hdr - > operation ) {
case CTDB_REQ_CALL :
2010-09-29 10:38:41 +10:00
CTDB_INCREMENT_STAT ( ctdb , client . req_call ) ;
2015-10-29 16:26:29 +11:00
daemon_request_call_from_client ( client , ( struct ctdb_req_call_old * ) hdr ) ;
2007-04-10 06:03:39 +10:00
break ;
2007-04-11 13:43:15 +10:00
case CTDB_REQ_MESSAGE :
2010-09-29 10:38:41 +10:00
CTDB_INCREMENT_STAT ( ctdb , client . req_message ) ;
2015-10-29 16:36:30 +11:00
daemon_request_message_from_client ( client , ( struct ctdb_req_message_old * ) hdr ) ;
2007-04-11 13:43:15 +10:00
break ;
2007-04-11 14:54:47 +10:00
2007-04-26 14:27:49 +02:00
case CTDB_REQ_CONTROL :
2010-09-29 10:38:41 +10:00
CTDB_INCREMENT_STAT ( ctdb , client . req_control ) ;
2015-10-29 16:42:05 +11:00
daemon_request_control_from_client ( client , ( struct ctdb_req_control_old * ) hdr ) ;
2007-04-26 14:27:49 +02:00
break ;
2017-04-06 19:09:58 +10:00
case CTDB_REQ_TUNNEL :
CTDB_INCREMENT_STAT ( ctdb , client . req_tunnel ) ;
daemon_request_tunnel_from_client ( client , ( struct ctdb_req_tunnel_old * ) hdr ) ;
break ;
2007-04-13 09:41:15 +10:00
default :
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_CRIT , ( __location__ " daemon: unrecognized operation %u \n " ,
2007-04-17 22:27:17 +10:00
hdr - > operation ) ) ;
2007-04-10 06:03:39 +10:00
}
2007-04-11 14:05:01 +10:00
done :
2007-04-18 11:20:24 +10:00
talloc_free ( tmp_ctx ) ;
2007-04-10 06:03:39 +10:00
}
2007-04-20 20:07:47 +10:00
/*
called when the daemon gets a incoming packet
*/
2007-04-17 14:52:51 +10:00
static void ctdb_daemon_read_cb ( uint8_t * data , size_t cnt , void * args )
2007-04-10 06:03:39 +10:00
{
2007-04-10 08:38:29 +10:00
struct ctdb_client * client = talloc_get_type ( args , struct ctdb_client ) ;
struct ctdb_req_header * hdr ;
2007-04-11 13:17:36 +02:00
if ( cnt = = 0 ) {
talloc_free ( client ) ;
return ;
}
2010-09-29 10:38:41 +10:00
CTDB_INCREMENT_STAT ( client - > ctdb , client_packets_recv ) ;
2007-04-20 20:07:47 +10:00
2007-04-10 08:38:29 +10:00
if ( cnt < sizeof ( * hdr ) ) {
2023-03-22 09:36:23 +01:00
ctdb_set_error ( client - > ctdb , " Bad packet length %u in daemon \n " ,
2007-04-28 11:35:49 +02:00
( unsigned ) cnt ) ;
2007-04-10 06:03:39 +10:00
return ;
}
2007-04-10 08:38:29 +10:00
hdr = ( struct ctdb_req_header * ) data ;
2007-04-10 06:03:39 +10:00
2007-04-10 08:38:29 +10:00
if ( hdr - > ctdb_magic ! = CTDB_MAGIC ) {
ctdb_set_error ( client - > ctdb , " Non CTDB packet rejected \n " ) ;
2018-03-13 09:06:45 +01:00
goto err_out ;
2007-04-10 06:03:39 +10:00
}
2014-10-21 11:53:29 +11:00
if ( hdr - > ctdb_version ! = CTDB_PROTOCOL ) {
2007-04-17 10:15:44 +10:00
ctdb_set_error ( client - > ctdb , " Bad CTDB version 0x%x rejected in daemon \n " , hdr - > ctdb_version ) ;
2018-03-13 09:06:45 +01:00
goto err_out ;
2007-04-10 06:03:39 +10:00
}
2008-02-04 17:44:24 +11:00
DEBUG ( DEBUG_DEBUG , ( __location__ " client request %u of type %u length %u from "
2007-05-23 20:15:09 +10:00
" node %u to %u \n " , hdr - > reqid , hdr - > operation , hdr - > length ,
2007-04-20 20:07:47 +10:00
hdr - > srcnode , hdr - > destnode ) ) ;
2007-04-10 08:38:29 +10:00
/* it is the responsibility of the incoming packet function to free 'data' */
2007-05-19 13:45:24 +10:00
daemon_incoming_packet ( client , hdr ) ;
2018-03-13 09:06:45 +01:00
return ;
err_out :
TALLOC_FREE ( data ) ;
2007-04-10 08:38:29 +10:00
}
2007-04-10 06:03:39 +10:00
2009-12-02 13:41:04 +11:00
static int ctdb_clientpid_destructor ( struct ctdb_client_pid_list * client_pid )
{
if ( client_pid - > ctdb - > client_pids ! = NULL ) {
DLIST_REMOVE ( client_pid - > ctdb - > client_pids , client_pid ) ;
}
return 0 ;
}
2019-05-06 15:22:49 +10:00
static int get_new_client_id ( struct reqid_context * idr ,
struct ctdb_client * client ,
uint32_t * out )
{
uint32_t client_id ;
client_id = reqid_new ( idr , client ) ;
/*
* Some places in the code ( e . g . ctdb_control_db_attach ( ) ,
* ctdb_control_db_detach ( ) ) assign a special meaning to
* client_id 0. The assumption is that if client_id is 0 then
* the control has come from another daemon . Therefore , we
* should never return client_id = = 0.
*/
if ( client_id = = 0 ) {
/*
* Don ' t leak ID 0. This is safe because the ID keeps
* increasing . A test will be added to ensure that
* this doesn ' t change .
*/
reqid_remove ( idr , 0 ) ;
client_id = reqid_new ( idr , client ) ;
}
if ( client_id = = REQID_INVALID ) {
return EINVAL ;
}
if ( client_id = = 0 ) {
/* Every other ID must have been used and we can't use 0 */
reqid_remove ( idr , 0 ) ;
return EINVAL ;
}
* out = client_id ;
return 0 ;
}
2009-12-02 13:41:04 +11:00
2015-10-26 16:50:09 +11:00
static void ctdb_accept_client ( struct tevent_context * ev ,
struct tevent_fd * fde , uint16_t flags ,
void * private_data )
2007-04-10 06:03:39 +10:00
{
2008-08-19 14:58:29 +10:00
struct sockaddr_un addr ;
2007-04-10 06:03:39 +10:00
socklen_t len ;
int fd ;
2007-04-13 20:38:24 +10:00
struct ctdb_context * ctdb = talloc_get_type ( private_data , struct ctdb_context ) ;
2007-04-10 06:03:39 +10:00
struct ctdb_client * client ;
2009-12-02 13:41:04 +11:00
struct ctdb_client_pid_list * client_pid ;
2011-11-05 19:04:40 +01:00
pid_t peer_pid = 0 ;
2016-08-10 17:35:22 +10:00
int ret ;
2007-04-10 06:03:39 +10:00
memset ( & addr , 0 , sizeof ( addr ) ) ;
len = sizeof ( addr ) ;
fd = accept ( ctdb - > daemon . sd , ( struct sockaddr * ) & addr , & len ) ;
if ( fd = = - 1 ) {
return ;
}
2017-12-11 09:36:08 +13:00
smb_set_close_on_exec ( fd ) ;
2007-05-30 15:43:25 +10:00
2016-08-10 17:35:22 +10:00
ret = set_blocking ( fd , false ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR ,
( __location__
" failed to set socket non-blocking (%s) \n " ,
strerror ( errno ) ) ) ;
close ( fd ) ;
return ;
}
2007-05-30 15:43:25 +10:00
set_close_on_exec ( fd ) ;
2009-10-15 11:24:54 +11:00
2009-10-21 15:26:24 +11:00
DEBUG ( DEBUG_DEBUG , ( __location__ " Created SOCKET FD:%d to connected child \n " , fd ) ) ;
2007-04-10 06:03:39 +10:00
client = talloc_zero ( ctdb , struct ctdb_client ) ;
2011-11-05 19:04:40 +01:00
if ( ctdb_get_peer_pid ( fd , & peer_pid ) = = 0 ) {
DEBUG ( DEBUG_INFO , ( " Connected client with pid:%u \n " , ( unsigned ) peer_pid ) ) ;
2008-04-01 15:34:54 +11:00
}
2007-04-10 06:03:39 +10:00
client - > ctdb = ctdb ;
client - > fd = fd ;
2019-05-06 15:22:49 +10:00
ret = get_new_client_id ( ctdb - > idr , client , & client - > client_id ) ;
if ( ret ! = 0 ) {
DBG_ERR ( " Unable to get client ID (%d) \n " , ret ) ;
close ( fd ) ;
talloc_free ( client ) ;
return ;
}
2011-11-05 19:04:40 +01:00
client - > pid = peer_pid ;
2009-12-02 13:41:04 +11:00
client_pid = talloc ( client , struct ctdb_client_pid_list ) ;
if ( client_pid = = NULL ) {
DEBUG ( DEBUG_ERR , ( " Failed to allocate client pid structure \n " ) ) ;
close ( fd ) ;
talloc_free ( client ) ;
return ;
2023-03-22 09:36:23 +01:00
}
2009-12-02 13:41:04 +11:00
client_pid - > ctdb = ctdb ;
2011-11-05 19:04:40 +01:00
client_pid - > pid = peer_pid ;
2009-12-02 13:41:04 +11:00
client_pid - > client = client ;
DLIST_ADD ( ctdb - > client_pids , client_pid ) ;
2007-04-10 06:03:39 +10:00
2023-03-22 09:36:23 +01:00
client - > queue = ctdb_queue_setup ( ctdb , client , fd , CTDB_DS_ALIGNMENT ,
2010-07-01 23:08:49 +10:00
ctdb_daemon_read_cb , client ,
" client-%u " , client - > pid ) ;
2007-04-10 06:03:39 +10:00
talloc_set_destructor ( client , ctdb_client_destructor ) ;
2009-12-02 13:41:04 +11:00
talloc_set_destructor ( client_pid , ctdb_clientpid_destructor ) ;
2013-04-19 13:29:04 +10:00
ctdb - > num_clients + + ;
2007-04-10 06:03:39 +10:00
}
/*
2020-10-24 20:29:58 +11:00
* Create a unix domain socket , bind it , secure it and listen . Return
* the file descriptor for the socket .
*/
2020-10-24 20:35:53 +11:00
static int ux_socket_bind ( struct ctdb_context * ctdb , bool test_mode_enabled )
2007-04-10 06:03:39 +10:00
{
2020-01-17 11:28:31 +01:00
struct sockaddr_un addr = { . sun_family = AF_UNIX } ;
2016-08-10 17:16:34 +10:00
int ret ;
2007-04-10 06:03:39 +10:00
ctdb - > daemon . sd = socket ( AF_UNIX , SOCK_STREAM , 0 ) ;
if ( ctdb - > daemon . sd = = - 1 ) {
return - 1 ;
}
2013-11-11 12:39:27 +11:00
strncpy ( addr . sun_path , ctdb - > daemon . name , sizeof ( addr . sun_path ) - 1 ) ;
2007-04-10 06:03:39 +10:00
2017-01-30 14:34:12 +11:00
if ( ! sock_clean ( ctdb - > daemon . name ) ) {
2016-09-22 14:52:55 +10:00
return - 1 ;
}
2013-07-19 15:36:29 +10:00
set_close_on_exec ( ctdb - > daemon . sd ) ;
2016-08-10 17:16:34 +10:00
ret = set_blocking ( ctdb - > daemon . sd , false ) ;
if ( ret ! = 0 ) {
2020-10-24 20:29:58 +11:00
DBG_ERR ( " Failed to set socket non-blocking (%s) \n " ,
strerror ( errno ) ) ;
2016-08-10 17:16:34 +10:00
goto failed ;
}
2013-07-19 15:36:29 +10:00
2020-10-24 20:29:58 +11:00
ret = bind ( ctdb - > daemon . sd , ( struct sockaddr * ) & addr , sizeof ( addr ) ) ;
if ( ret = = - 1 ) {
D_ERR ( " Unable to bind on ctdb socket '%s' \n " , ctdb - > daemon . name ) ;
2007-05-13 09:20:16 +10:00
goto failed ;
2013-07-19 15:36:29 +10:00
}
2008-04-10 06:51:53 +10:00
2020-10-24 20:35:53 +11:00
if ( ! test_mode_enabled ) {
ret = chown ( ctdb - > daemon . name , geteuid ( ) , getegid ( ) ) ;
if ( ret ! = 0 & & ! test_mode_enabled ) {
D_ERR ( " Unable to secure (chown) ctdb socket '%s' \n " ,
ctdb - > daemon . name ) ;
goto failed ;
}
2020-10-24 20:29:58 +11:00
}
ret = chmod ( ctdb - > daemon . name , 0700 ) ;
if ( ret ! = 0 ) {
D_ERR ( " Unable to secure (chmod) ctdb socket '%s' \n " ,
ctdb - > daemon . name ) ;
2008-04-10 06:51:53 +10:00
goto failed ;
2013-07-19 15:36:29 +10:00
}
2008-04-10 06:51:53 +10:00
2020-10-24 20:29:58 +11:00
ret = listen ( ctdb - > daemon . sd , 100 ) ;
if ( ret ! = 0 ) {
D_ERR ( " Unable to listen on ctdb socket '%s' \n " ,
ctdb - > daemon . name ) ;
2007-05-13 09:20:16 +10:00
goto failed ;
}
2007-04-10 06:03:39 +10:00
2020-10-24 20:29:58 +11:00
D_NOTICE ( " Listening to ctdb socket %s \n " , ctdb - > daemon . name ) ;
2007-04-10 06:03:39 +10:00
return 0 ;
2007-05-13 09:20:16 +10:00
failed :
close ( ctdb - > daemon . sd ) ;
ctdb - > daemon . sd = - 1 ;
2020-10-24 20:29:58 +11:00
return - 1 ;
2007-04-10 06:03:39 +10:00
}
2021-07-09 14:01:33 +10:00
struct ctdb_node * ctdb_find_node ( struct ctdb_context * ctdb , uint32_t pnn )
2012-12-04 14:28:06 +11:00
{
2021-07-28 10:27:42 +10:00
struct ctdb_node * node = NULL ;
2019-06-22 06:23:12 +10:00
unsigned int i ;
2021-07-09 14:01:33 +10:00
if ( pnn = = CTDB_CURRENT_NODE ) {
pnn = ctdb - > pnn ;
}
2019-06-22 06:23:12 +10:00
/* Always found: PNN correctly set just before this is called */
for ( i = 0 ; i < ctdb - > num_nodes ; i + + ) {
2021-07-28 10:27:42 +10:00
node = ctdb - > nodes [ i ] ;
2021-07-09 14:01:33 +10:00
if ( pnn = = node - > pnn ) {
return node ;
2019-06-22 06:23:12 +10:00
}
2012-12-04 14:28:06 +11:00
}
2021-07-09 14:01:33 +10:00
return NULL ;
}
static void initialise_node_flags ( struct ctdb_context * ctdb )
{
struct ctdb_node * node = NULL ;
node = ctdb_find_node ( ctdb , CTDB_CURRENT_NODE ) ;
/*
* PNN correctly set just before this is called so always
* found but keep static analysers happy . . .
*/
if ( node = = NULL ) {
DBG_ERR ( " Unable to find current node \n " ) ;
return ;
}
2021-07-28 10:27:42 +10:00
node - > flags & = ~ NODE_FLAGS_DISCONNECTED ;
2012-12-04 14:28:06 +11:00
/* do we start out in DISABLED mode? */
if ( ctdb - > start_as_disabled ! = 0 ) {
2019-06-22 06:23:12 +10:00
D_ERR ( " This node is configured to start in DISABLED state \n " ) ;
2021-07-09 14:02:28 +10:00
node - > flags | = NODE_FLAGS_PERMANENTLY_DISABLED ;
2012-12-04 14:28:06 +11:00
}
/* do we start out in STOPPED mode? */
if ( ctdb - > start_as_stopped ! = 0 ) {
2019-06-22 06:23:12 +10:00
D_ERR ( " This node is configured to start in STOPPED state \n " ) ;
2021-07-28 10:27:42 +10:00
node - > flags | = NODE_FLAGS_STOPPED ;
2012-12-04 14:28:06 +11:00
}
}
2010-02-12 11:24:08 +01:00
static void ctdb_setup_event_callback ( struct ctdb_context * ctdb , int status ,
void * private_data )
{
if ( status ! = 0 ) {
2013-06-30 17:48:01 +10:00
ctdb_die ( ctdb , " Failed to run setup event " ) ;
2010-02-12 11:24:08 +01:00
}
ctdb_run_notification_script ( ctdb , " setup " ) ;
2013-01-10 16:33:36 +11:00
/* Start the recovery daemon */
if ( ctdb_start_recoverd ( ctdb ) ! = 0 ) {
DEBUG ( DEBUG_ALERT , ( " Failed to start recovery daemon \n " ) ) ;
exit ( 11 ) ;
}
ctdb_start_periodic_events ( ctdb ) ;
2013-12-18 15:37:11 +11:00
ctdb_wait_for_first_recovery ( ctdb ) ;
2010-02-12 11:24:08 +01:00
}
2012-06-07 15:08:15 +10:00
static struct timeval tevent_before_wait_ts ;
static struct timeval tevent_after_wait_ts ;
2015-03-27 16:23:48 +11:00
static void ctdb_tevent_trace_init ( void )
{
struct timeval now ;
now = timeval_current ( ) ;
tevent_before_wait_ts = now ;
tevent_after_wait_ts = now ;
}
2012-06-07 15:08:15 +10:00
static void ctdb_tevent_trace ( enum tevent_trace_point tp ,
void * private_data )
{
struct timeval diff ;
struct timeval now ;
2014-07-03 12:29:46 +10:00
struct ctdb_context * ctdb =
talloc_get_type ( private_data , struct ctdb_context ) ;
2012-06-07 15:08:15 +10:00
2014-07-03 12:29:46 +10:00
if ( getpid ( ) ! = ctdb - > ctdbd_pid ) {
2012-06-07 15:08:15 +10:00
return ;
}
now = timeval_current ( ) ;
switch ( tp ) {
case TEVENT_TRACE_BEFORE_WAIT :
2024-03-13 16:07:00 +01:00
diff = tevent_timeval_until ( & tevent_after_wait_ts , & now ) ;
2015-03-27 16:23:48 +11:00
if ( diff . tv_sec > 3 ) {
DEBUG ( DEBUG_ERR ,
( " Handling event took %ld seconds! \n " ,
2016-10-17 11:27:17 +02:00
( long ) diff . tv_sec ) ) ;
2012-06-07 15:08:15 +10:00
}
tevent_before_wait_ts = now ;
break ;
case TEVENT_TRACE_AFTER_WAIT :
2024-03-13 16:07:00 +01:00
diff = tevent_timeval_until ( & tevent_before_wait_ts , & now ) ;
2015-03-27 16:23:48 +11:00
if ( diff . tv_sec > 3 ) {
DEBUG ( DEBUG_ERR ,
( " No event for %ld seconds! \n " ,
2016-10-17 11:27:17 +02:00
( long ) diff . tv_sec ) ) ;
2012-06-07 15:08:15 +10:00
}
tevent_after_wait_ts = now ;
break ;
default :
/* Do nothing for future tevent trace points */ ;
}
}
2013-04-15 13:32:57 +10:00
static void ctdb_remove_pidfile ( void )
{
2016-09-22 14:35:03 +10:00
TALLOC_FREE ( ctdbd_pidfile_ctx ) ;
2013-04-15 13:32:57 +10:00
}
2016-09-22 14:35:03 +10:00
static void ctdb_create_pidfile ( TALLOC_CTX * mem_ctx )
2013-04-15 13:32:57 +10:00
{
if ( ctdbd_pidfile ! = NULL ) {
2017-07-31 15:16:45 +10:00
int ret = pidfile_context_create ( mem_ctx , ctdbd_pidfile ,
& ctdbd_pidfile_ctx ) ;
2016-09-22 14:35:03 +10:00
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR ,
( " Failed to create PID file %s \n " ,
ctdbd_pidfile ) ) ;
2013-04-15 13:32:57 +10:00
exit ( 11 ) ;
}
2013-04-22 13:52:04 +10:00
DEBUG ( DEBUG_NOTICE , ( " Created PID file %s \n " , ctdbd_pidfile ) ) ;
2013-04-15 13:32:57 +10:00
atexit ( ctdb_remove_pidfile ) ;
}
}
2015-02-17 12:34:41 +11:00
static void ctdb_initialise_vnn_map ( struct ctdb_context * ctdb )
{
2019-06-08 06:38:56 +10:00
unsigned int i , j , count ;
2015-02-17 12:34:41 +11:00
/* initialize the vnn mapping table, skipping any deleted nodes */
ctdb - > vnn_map = talloc ( ctdb , struct ctdb_vnn_map ) ;
CTDB_NO_MEMORY_FATAL ( ctdb , ctdb - > vnn_map ) ;
count = 0 ;
for ( i = 0 ; i < ctdb - > num_nodes ; i + + ) {
if ( ( ctdb - > nodes [ i ] - > flags & NODE_FLAGS_DELETED ) = = 0 ) {
count + + ;
}
}
ctdb - > vnn_map - > generation = INVALID_GENERATION ;
ctdb - > vnn_map - > size = count ;
ctdb - > vnn_map - > map = talloc_array ( ctdb - > vnn_map , uint32_t , ctdb - > vnn_map - > size ) ;
CTDB_NO_MEMORY_FATAL ( ctdb , ctdb - > vnn_map - > map ) ;
for ( i = 0 , j = 0 ; i < ctdb - > vnn_map - > size ; i + + ) {
if ( ctdb - > nodes [ i ] - > flags & NODE_FLAGS_DELETED ) {
continue ;
}
ctdb - > vnn_map - > map [ j ] = i ;
j + + ;
}
}
2015-02-17 15:21:15 +11:00
static void ctdb_set_my_pnn ( struct ctdb_context * ctdb )
{
2015-02-20 11:47:23 +11:00
if ( ctdb - > address = = NULL ) {
2015-02-17 15:21:15 +11:00
ctdb_fatal ( ctdb ,
" Can not determine PNN - node address is not set \n " ) ;
}
2019-06-22 05:53:15 +10:00
ctdb - > pnn = ctdb_ip_to_pnn ( ctdb , ctdb - > address ) ;
if ( ctdb - > pnn = = CTDB_UNKNOWN_PNN ) {
2015-02-17 15:21:15 +11:00
ctdb_fatal ( ctdb ,
2019-06-22 05:53:15 +10:00
" Can not determine PNN - unknown node address \n " ) ;
2015-02-17 15:21:15 +11:00
}
2019-06-22 05:53:15 +10:00
D_NOTICE ( " PNN is %u \n " , ctdb - > pnn ) ;
2015-02-17 15:21:15 +11:00
}
2020-01-13 21:04:54 +11:00
static void stdin_handler ( struct tevent_context * ev ,
struct tevent_fd * fde ,
uint16_t flags ,
void * private_data )
{
struct ctdb_context * ctdb = talloc_get_type_abort (
private_data , struct ctdb_context ) ;
ssize_t nread ;
char c ;
nread = read ( STDIN_FILENO , & c , 1 ) ;
if ( nread ! = 1 ) {
D_ERR ( " stdin closed, exiting \n " ) ;
talloc_free ( fde ) ;
ctdb_shutdown_sequence ( ctdb , EPIPE ) ;
}
}
static int setup_stdin_handler ( struct ctdb_context * ctdb )
{
struct tevent_fd * fde ;
struct stat st ;
int ret ;
ret = fstat ( STDIN_FILENO , & st ) ;
if ( ret ! = 0 ) {
/* Problem with stdin, ignore... */
DBG_INFO ( " Can't fstat() stdin \n " ) ;
return 0 ;
}
if ( ! S_ISFIFO ( st . st_mode ) ) {
DBG_INFO ( " Not a pipe... \n " ) ;
return 0 ;
}
fde = tevent_add_fd ( ctdb - > ev ,
ctdb ,
STDIN_FILENO ,
TEVENT_FD_READ ,
stdin_handler ,
ctdb ) ;
if ( fde = = NULL ) {
return ENOMEM ;
}
DBG_INFO ( " Set up stdin handler \n " ) ;
return 0 ;
}
2020-01-29 16:28:46 +11:00
static void fork_only ( void )
{
pid_t pid ;
pid = fork ( ) ;
if ( pid = = - 1 ) {
D_ERR ( " Fork failed (errno=%d) \n " , errno ) ;
exit ( 1 ) ;
}
if ( pid ! = 0 ) {
/* Parent simply exits... */
exit ( 0 ) ;
}
}
2021-09-30 21:08:25 +10:00
static void sighup_hook ( void * private_data )
{
struct ctdb_context * ctdb = talloc_get_type_abort ( private_data ,
struct ctdb_context ) ;
if ( ctdb - > recoverd_pid > 0 ) {
kill ( ctdb - > recoverd_pid , SIGHUP ) ;
}
2021-09-30 21:10:33 +10:00
ctdb_event_reopen_logs ( ctdb ) ;
2021-09-30 21:08:25 +10:00
}
2007-04-29 16:19:40 +02:00
/*
start the protocol going as a daemon
*/
2020-01-29 16:08:56 +11:00
int ctdb_start_daemon ( struct ctdb_context * ctdb ,
bool interactive ,
bool test_mode_enabled )
2007-04-29 16:19:40 +02:00
{
2021-09-30 21:06:16 +10:00
bool status ;
2020-10-24 21:54:21 +11:00
int ret ;
2015-10-26 16:50:09 +11:00
struct tevent_fd * fde ;
2007-04-29 16:19:40 +02:00
2020-01-29 16:28:46 +11:00
/* Fork if not interactive */
if ( ! interactive ) {
if ( test_mode_enabled ) {
/* Keep stdin open */
fork_only ( ) ;
} else {
/* Fork, close stdin, start a session */
become_daemon ( true , false , false ) ;
}
}
2007-04-29 16:19:40 +02:00
2014-06-06 14:58:17 +10:00
ignore_signal ( SIGPIPE ) ;
2015-07-21 12:23:27 +10:00
ignore_signal ( SIGUSR1 ) ;
2007-04-29 16:19:40 +02:00
2014-07-03 12:29:46 +10:00
ctdb - > ctdbd_pid = getpid ( ) ;
2013-05-22 15:37:46 +10:00
DEBUG ( DEBUG_ERR , ( " Starting CTDBD (Version %s) as PID: %u \n " ,
2019-03-15 12:14:27 +11:00
SAMBA_VERSION_STRING , ctdb - > ctdbd_pid ) ) ;
2016-09-22 14:35:03 +10:00
ctdb_create_pidfile ( ctdb ) ;
2009-10-27 13:18:52 +11:00
2016-09-22 14:43:58 +10:00
/* create a unix domain stream socket to listen to */
2020-10-24 20:35:53 +11:00
ret = ux_socket_bind ( ctdb , test_mode_enabled ) ;
2020-10-24 21:54:21 +11:00
if ( ret ! = 0 ) {
D_ERR ( " Cannot continue. Exiting! \n " ) ;
2016-09-22 14:43:58 +10:00
exit ( 10 ) ;
}
2013-07-17 11:14:37 +10:00
/* Make sure we log something when the daemon terminates.
* This must be the first exit handler to run ( so the last to
* be registered .
*/
2016-11-25 14:54:07 +11:00
__ctdbd_pid = getpid ( ) ;
2013-07-17 11:14:37 +10:00
atexit ( print_exit_message ) ;
2011-01-10 13:35:39 +11:00
if ( ctdb - > do_setsched ) {
/* try to set us up as realtime */
2014-09-12 11:22:36 +10:00
if ( ! set_scheduler ( ) ) {
exit ( 1 ) ;
}
DEBUG ( DEBUG_NOTICE , ( " Set real-time scheduler priority \n " ) ) ;
2011-01-10 13:35:39 +11:00
}
2007-05-24 14:52:10 +10:00
2015-10-26 16:50:09 +11:00
ctdb - > ev = tevent_context_init ( NULL ) ;
2016-07-27 11:45:49 +10:00
if ( ctdb - > ev = = NULL ) {
DEBUG ( DEBUG_ALERT , ( " tevent_context_init() failed \n " ) ) ;
exit ( 1 ) ;
}
2010-08-18 10:11:59 +10:00
tevent_loop_allow_nesting ( ctdb - > ev ) ;
2015-03-27 16:23:48 +11:00
ctdb_tevent_trace_init ( ) ;
2014-07-03 12:29:46 +10:00
tevent_set_trace_callback ( ctdb - > ev , ctdb_tevent_trace , ctdb ) ;
2007-05-09 09:59:23 +10:00
2021-09-30 21:06:16 +10:00
status = logging_setup_sighup_handler ( ctdb - > ev ,
ctdb ,
2021-09-30 21:08:25 +10:00
sighup_hook ,
ctdb ) ;
2021-09-30 21:06:16 +10:00
if ( ! status ) {
D_ERR ( " Failed to set up signal handler for SIGHUP \n " ) ;
exit ( 1 ) ;
}
2012-05-03 11:42:41 +10:00
/* set up a handler to pick up sigchld */
if ( ctdb_init_sigchld ( ctdb ) = = NULL ) {
DEBUG ( DEBUG_CRIT , ( " Failed to set up signal handler for SIGCHLD \n " ) ) ;
exit ( 1 ) ;
}
2020-01-29 16:26:03 +11:00
if ( ! interactive ) {
2016-11-29 17:52:00 +11:00
ctdb_set_child_logging ( ctdb ) ;
}
2008-01-16 22:03:01 +11:00
2020-01-13 21:04:54 +11:00
/* Exit if stdin is closed */
2020-01-29 16:26:03 +11:00
if ( test_mode_enabled ) {
2020-01-13 21:04:54 +11:00
ret = setup_stdin_handler ( ctdb ) ;
if ( ret ! = 0 ) {
DBG_ERR ( " Failed to setup stdin handler \n " ) ;
exit ( 1 ) ;
}
}
2016-04-05 17:11:17 +10:00
TALLOC_FREE ( ctdb - > srv ) ;
2015-04-08 14:38:26 +10:00
if ( srvid_init ( ctdb , & ctdb - > srv ) ! = 0 ) {
DEBUG ( DEBUG_CRIT , ( " Failed to setup message srvid context \n " ) ) ;
exit ( 1 ) ;
}
2017-04-06 19:03:51 +10:00
TALLOC_FREE ( ctdb - > tunnels ) ;
if ( srvid_init ( ctdb , & ctdb - > tunnels ) ! = 0 ) {
DEBUG ( DEBUG_ERR , ( " Failed to setup tunnels context \n " ) ) ;
exit ( 1 ) ;
}
2010-09-29 12:13:05 +10:00
/* initialize statistics collection */
ctdb_statistics_init ( ctdb ) ;
2007-09-21 12:24:02 +10:00
/* force initial recovery for election */
ctdb - > recovery_mode = CTDB_RECOVERY_ACTIVE ;
2016-09-16 20:06:07 +10:00
if ( ctdb_start_eventd ( ctdb ) ! = 0 ) {
DEBUG ( DEBUG_ERR , ( " Failed to start event daemon \n " ) ) ;
exit ( 1 ) ;
}
2013-06-16 19:49:02 +10:00
ctdb_set_runstate ( ctdb , CTDB_RUNSTATE_INIT ) ;
ret = ctdb_event_script ( ctdb , CTDB_EVENT_INIT ) ;
if ( ret ! = 0 ) {
2013-06-30 17:43:52 +10:00
ctdb_die ( ctdb , " Failed to run init event \n " ) ;
2013-06-16 19:49:02 +10:00
}
ctdb_run_notification_script ( ctdb , " init " ) ;
2007-09-21 12:24:02 +10:00
if ( strcmp ( ctdb - > transport , " tcp " ) = = 0 ) {
ret = ctdb_tcp_init ( ctdb ) ;
}
# ifdef USE_INFINIBAND
if ( strcmp ( ctdb - > transport , " ib " ) = = 0 ) {
ret = ctdb_ibw_init ( ctdb ) ;
}
# endif
if ( ret ! = 0 ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( " Failed to initialise transport '%s' \n " , ctdb - > transport ) ) ;
2007-09-21 12:24:02 +10:00
return - 1 ;
}
2008-05-11 14:28:33 +10:00
if ( ctdb - > methods = = NULL ) {
DEBUG ( DEBUG_ALERT , ( __location__ " Can not initialize transport. ctdb->methods is NULL \n " ) ) ;
ctdb_fatal ( ctdb , " transport is unavailable. can not initialize. " ) ;
}
2015-02-17 15:21:15 +11:00
/* Initialise the transport. This sets the node address if it
* was not set via the command - line . */
2007-09-21 12:24:02 +10:00
if ( ctdb - > methods - > initialise ( ctdb ) ! = 0 ) {
ctdb_fatal ( ctdb , " transport failed to initialise " ) ;
}
2012-12-04 14:28:06 +11:00
2015-02-17 15:21:15 +11:00
ctdb_set_my_pnn ( ctdb ) ;
2012-12-04 14:28:06 +11:00
initialise_node_flags ( ctdb ) ;
2018-03-06 11:30:07 +11:00
ret = ctdb_set_public_addresses ( ctdb , true ) ;
if ( ret = = - 1 ) {
D_ERR ( " Unable to setup public IP addresses \n " ) ;
exit ( 1 ) ;
2010-11-10 12:59:25 +11:00
}
2015-02-17 12:34:41 +11:00
ctdb_initialise_vnn_map ( ctdb ) ;
2007-09-21 12:24:02 +10:00
2009-11-29 12:39:23 +01:00
/* attach to existing databases */
if ( ctdb_attach_databases ( ctdb ) ! = 0 ) {
ctdb_fatal ( ctdb , " Failed to attach to databases \n " ) ;
2007-09-21 12:24:02 +10:00
}
2010-08-25 08:34:35 +10:00
/* start frozen, then let the first election sort things out */
2012-06-06 16:19:10 +10:00
if ( ! ctdb_blocking_freeze ( ctdb ) ) {
2010-08-25 08:34:35 +10:00
ctdb_fatal ( ctdb , " Failed to get initial freeze \n " ) ;
}
2007-05-23 12:23:07 +10:00
/* now start accepting clients, only can do this once frozen */
2015-10-26 16:50:09 +11:00
fde = tevent_add_fd ( ctdb - > ev , ctdb , ctdb - > daemon . sd , TEVENT_FD_READ ,
ctdb_accept_client , ctdb ) ;
2011-08-10 17:53:56 +02:00
if ( fde = = NULL ) {
ctdb_fatal ( ctdb , " Failed to add daemon socket to event loop " ) ;
}
2010-08-18 09:16:31 +09:30
tevent_fd_set_auto_close ( fde ) ;
2007-05-23 12:23:07 +10:00
2013-01-10 16:33:36 +11:00
/* Start the transport */
if ( ctdb - > methods - > start ( ctdb ) ! = 0 ) {
DEBUG ( DEBUG_ALERT , ( " transport failed to start! \n " ) ) ;
ctdb_fatal ( ctdb , " transport failed to start " ) ;
}
/* Recovery daemon and timed events are started from the
* callback , only after the setup event completes
* successfully .
*/
ctdb_set_runstate ( ctdb , CTDB_RUNSTATE_SETUP ) ;
2010-02-12 11:24:08 +01:00
ret = ctdb_event_script_callback ( ctdb ,
ctdb ,
ctdb_setup_event_callback ,
ctdb ,
CTDB_EVENT_SETUP ,
2011-11-05 17:26:40 +01:00
" %s " ,
2010-02-12 11:24:08 +01:00
" " ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_CRIT , ( " Failed to set up 'setup' event \n " ) ) ;
exit ( 1 ) ;
}
2014-06-10 17:00:38 +10:00
lockdown_memory ( ctdb - > valgrinding ) ;
2014-06-06 15:08:22 +10:00
2007-09-21 12:24:02 +10:00
/* go into a wait loop to allow other nodes to complete */
2015-10-26 16:50:09 +11:00
tevent_loop_wait ( ctdb - > ev ) ;
2007-09-21 12:24:02 +10:00
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_CRIT , ( " event_loop_wait() returned. this should not happen \n " ) ) ;
2007-09-21 12:24:02 +10:00
exit ( 1 ) ;
2007-04-29 16:19:40 +02:00
}
2007-04-28 10:50:32 +02:00
/*
allocate a packet for use in daemon < - > daemon communication
*/
struct ctdb_req_header * _ctdb_transport_allocate ( struct ctdb_context * ctdb ,
2023-03-22 09:36:23 +01:00
TALLOC_CTX * mem_ctx ,
enum ctdb_operation operation ,
2007-04-28 10:50:32 +02:00
size_t length , size_t slength ,
const char * type )
{
int size ;
struct ctdb_req_header * hdr ;
2007-05-03 13:44:27 +10:00
length = MAX ( length , slength ) ;
size = ( length + ( CTDB_DS_ALIGNMENT - 1 ) ) & ~ ( CTDB_DS_ALIGNMENT - 1 ) ;
2008-05-11 14:28:33 +10:00
if ( ctdb - > methods = = NULL ) {
2010-10-28 13:38:34 +11:00
DEBUG ( DEBUG_INFO , ( __location__ " Unable to allocate transport packet for operation %u of length %u. Transport is DOWN. \n " ,
2008-05-11 14:28:33 +10:00
operation , ( unsigned ) length ) ) ;
return NULL ;
}
2007-04-28 10:50:32 +02:00
hdr = ( struct ctdb_req_header * ) ctdb - > methods - > allocate_pkt ( mem_ctx , size ) ;
if ( hdr = = NULL ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( " Unable to allocate transport packet for operation %u of length %u \n " ,
2007-05-29 13:58:41 +10:00
operation , ( unsigned ) length ) ) ;
2007-04-28 10:50:32 +02:00
return NULL ;
}
talloc_set_name_const ( hdr , type ) ;
2007-05-03 13:44:27 +10:00
memset ( hdr , 0 , slength ) ;
hdr - > length = length ;
2007-04-28 10:50:32 +02:00
hdr - > operation = operation ;
hdr - > ctdb_magic = CTDB_MAGIC ;
2014-10-21 11:53:29 +11:00
hdr - > ctdb_version = CTDB_PROTOCOL ;
2007-04-28 10:50:32 +02:00
hdr - > generation = ctdb - > vnn_map - > generation ;
2007-09-04 10:06:36 +10:00
hdr - > srcnode = ctdb - > pnn ;
2007-04-28 10:50:32 +02:00
2023-03-22 09:36:23 +01:00
return hdr ;
2007-04-10 06:03:39 +10:00
}
2007-04-26 14:27:49 +02:00
struct daemon_control_state {
2007-05-18 23:48:29 +10:00
struct daemon_control_state * next , * prev ;
2007-04-26 14:27:49 +02:00
struct ctdb_client * client ;
2015-10-29 16:42:05 +11:00
struct ctdb_req_control_old * c ;
2007-04-26 19:27:07 +02:00
uint32_t reqid ;
2007-05-18 23:48:29 +10:00
struct ctdb_node * node ;
2007-04-26 14:27:49 +02:00
} ;
/*
callback when a control reply comes in
*/
static void daemon_control_callback ( struct ctdb_context * ctdb ,
2023-03-22 09:36:23 +01:00
int32_t status , TDB_DATA data ,
2007-05-12 21:25:26 +10:00
const char * errormsg ,
2007-04-26 14:27:49 +02:00
void * private_data )
{
2023-03-22 09:36:23 +01:00
struct daemon_control_state * state = talloc_get_type ( private_data ,
2007-04-26 14:27:49 +02:00
struct daemon_control_state ) ;
struct ctdb_client * client = state - > client ;
2015-10-29 16:44:08 +11:00
struct ctdb_reply_control_old * r ;
2007-04-26 14:27:49 +02:00
size_t len ;
2010-02-04 14:36:14 +11:00
int ret ;
2007-04-26 14:27:49 +02:00
/* construct a message to send to the client containing the data */
2015-10-29 16:44:08 +11:00
len = offsetof ( struct ctdb_reply_control_old , data ) + data . dsize ;
2007-05-12 21:25:26 +10:00
if ( errormsg ) {
len + = strlen ( errormsg ) ;
}
2023-03-22 09:36:23 +01:00
r = ctdbd_allocate_pkt ( ctdb , state , CTDB_REPLY_CONTROL , len ,
2015-10-29 16:44:08 +11:00
struct ctdb_reply_control_old ) ;
2007-04-28 10:50:32 +02:00
CTDB_NO_MEMORY_VOID ( ctdb , r ) ;
2007-04-26 14:27:49 +02:00
2007-04-26 19:27:07 +02:00
r - > hdr . reqid = state - > reqid ;
2007-04-26 14:27:49 +02:00
r - > status = status ;
r - > datalen = data . dsize ;
2007-05-12 21:25:26 +10:00
r - > errorlen = 0 ;
2007-04-26 14:27:49 +02:00
memcpy ( & r - > data [ 0 ] , data . dptr , data . dsize ) ;
2007-05-12 21:25:26 +10:00
if ( errormsg ) {
r - > errorlen = strlen ( errormsg ) ;
memcpy ( & r - > data [ r - > datalen ] , errormsg , r - > errorlen ) ;
}
2007-04-26 14:27:49 +02:00
2010-02-04 14:36:14 +11:00
ret = daemon_queue_send ( client , & r - > hdr ) ;
if ( ret ! = - 1 ) {
talloc_free ( state ) ;
}
2007-04-26 14:27:49 +02:00
}
2007-05-18 23:48:29 +10:00
/*
fail all pending controls to a disconnected node
*/
void ctdb_daemon_cancel_controls ( struct ctdb_context * ctdb , struct ctdb_node * node )
{
struct daemon_control_state * state ;
while ( ( state = node - > pending_controls ) ) {
DLIST_REMOVE ( node - > pending_controls , state ) ;
2023-03-22 09:36:23 +01:00
daemon_control_callback ( ctdb , ( uint32_t ) - 1 , tdb_null ,
2007-05-18 23:48:29 +10:00
" node is disconnected " , state ) ;
}
}
/*
destroy a daemon_control_state
*/
static int daemon_control_destructor ( struct daemon_control_state * state )
{
if ( state - > node ) {
DLIST_REMOVE ( state - > node - > pending_controls , state ) ;
}
return 0 ;
}
2007-04-26 14:27:49 +02:00
/*
this is called when the ctdb daemon received a ctdb request control
from a local client over the unix domain socket
*/
2023-03-22 09:36:23 +01:00
static void daemon_request_control_from_client ( struct ctdb_client * client ,
2015-10-29 16:42:05 +11:00
struct ctdb_req_control_old * c )
2007-04-26 14:27:49 +02:00
{
TDB_DATA data ;
int res ;
struct daemon_control_state * state ;
2007-06-02 10:03:28 +10:00
TALLOC_CTX * tmp_ctx = talloc_new ( client ) ;
2007-04-26 14:27:49 +02:00
2007-04-26 19:27:07 +02:00
if ( c - > hdr . destnode = = CTDB_CURRENT_NODE ) {
2007-09-04 10:06:36 +10:00
c - > hdr . destnode = client - > ctdb - > pnn ;
2007-04-26 19:27:07 +02:00
}
2007-04-26 14:27:49 +02:00
state = talloc ( client , struct daemon_control_state ) ;
CTDB_NO_MEMORY_VOID ( client - > ctdb , state ) ;
state - > client = client ;
state - > c = talloc_steal ( state , c ) ;
2007-04-26 19:27:07 +02:00
state - > reqid = c - > hdr . reqid ;
2007-09-04 10:09:58 +10:00
if ( ctdb_validate_pnn ( client - > ctdb , c - > hdr . destnode ) ) {
2007-05-18 23:48:29 +10:00
state - > node = client - > ctdb - > nodes [ c - > hdr . destnode ] ;
DLIST_ADD ( state - > node - > pending_controls , state ) ;
} else {
state - > node = NULL ;
}
talloc_set_destructor ( state , daemon_control_destructor ) ;
2007-06-02 10:03:28 +10:00
if ( c - > flags & CTDB_CTRL_FLAG_NOREPLY ) {
talloc_steal ( tmp_ctx , state ) ;
}
2023-03-22 09:36:23 +01:00
2007-04-26 14:27:49 +02:00
data . dptr = & c - > data [ 0 ] ;
data . dsize = c - > datalen ;
res = ctdb_daemon_send_control ( client - > ctdb , c - > hdr . destnode ,
2007-05-04 11:41:29 +10:00
c - > srvid , c - > opcode , client - > client_id ,
c - > flags ,
2007-04-30 15:31:40 +02:00
data , daemon_control_callback ,
2007-04-26 14:27:49 +02:00
state ) ;
if ( res ! = 0 ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Failed to send control to remote node %u \n " ,
2007-04-26 14:27:49 +02:00
c - > hdr . destnode ) ) ;
}
2007-05-18 23:48:29 +10:00
2007-06-02 10:03:28 +10:00
talloc_free ( tmp_ctx ) ;
2007-04-26 14:27:49 +02:00
}
2007-04-30 15:31:40 +02:00
2017-04-06 19:09:58 +10:00
static void daemon_request_tunnel_from_client ( struct ctdb_client * client ,
struct ctdb_req_tunnel_old * c )
{
TDB_DATA data ;
int ret ;
if ( ! ctdb_validate_pnn ( client - > ctdb , c - > hdr . destnode ) ) {
DEBUG ( DEBUG_ERR , ( " Invalid destination 0x%x \n " ,
c - > hdr . destnode ) ) ;
return ;
}
ret = srvid_exists ( client - > ctdb - > tunnels , c - > tunnel_id , NULL ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR ,
( " tunnel id 0x% " PRIx64 " not registered, dropping pkt \n " ,
c - > tunnel_id ) ) ;
return ;
}
data = ( TDB_DATA ) {
. dsize = c - > datalen ,
. dptr = & c - > data [ 0 ] ,
} ;
ret = ctdb_daemon_send_tunnel ( client - > ctdb , c - > hdr . destnode ,
c - > tunnel_id , c - > flags , data ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR , ( " Failed to set tunnel to remote note %u \n " ,
c - > hdr . destnode ) ) ;
}
}
2007-04-30 15:31:40 +02:00
/*
register a call function
*/
int ctdb_daemon_set_call ( struct ctdb_context * ctdb , uint32_t db_id ,
ctdb_fn_t fn , int id )
{
struct ctdb_registered_call * call ;
struct ctdb_db_context * ctdb_db ;
ctdb_db = find_ctdb_db ( ctdb , db_id ) ;
if ( ctdb_db = = NULL ) {
return - 1 ;
}
call = talloc ( ctdb_db , struct ctdb_registered_call ) ;
call - > fn = fn ;
call - > id = id ;
2023-03-22 09:36:23 +01:00
DLIST_ADD ( ctdb_db - > calls , call ) ;
2007-04-30 15:31:40 +02:00
return 0 ;
}
2007-06-07 22:06:19 +10:00
/*
this local messaging handler is ugly , but is needed to prevent
recursion in ctdb_send_message ( ) when the destination node is the
same as the source node
*/
struct ctdb_local_message {
struct ctdb_context * ctdb ;
uint64_t srvid ;
TDB_DATA data ;
} ;
2015-10-26 16:50:09 +11:00
static void ctdb_local_message_trigger ( struct tevent_context * ev ,
struct tevent_timer * te ,
2007-06-07 22:06:19 +10:00
struct timeval t , void * private_data )
{
2015-04-08 14:38:26 +10:00
struct ctdb_local_message * m = talloc_get_type (
private_data , struct ctdb_local_message ) ;
2007-06-07 22:06:19 +10:00
2015-04-08 14:38:26 +10:00
srvid_dispatch ( m - > ctdb - > srv , m - > srvid , CTDB_SRVID_ALL , m - > data ) ;
2007-06-07 22:06:19 +10:00
talloc_free ( m ) ;
}
static int ctdb_local_message ( struct ctdb_context * ctdb , uint64_t srvid , TDB_DATA data )
{
struct ctdb_local_message * m ;
m = talloc ( ctdb , struct ctdb_local_message ) ;
CTDB_NO_MEMORY ( ctdb , m ) ;
m - > ctdb = ctdb ;
m - > srvid = srvid ;
m - > data = data ;
m - > data . dptr = talloc_memdup ( m , m - > data . dptr , m - > data . dsize ) ;
if ( m - > data . dptr = = NULL ) {
talloc_free ( m ) ;
return - 1 ;
}
/* this needs to be done as an event to prevent recursion */
2015-10-26 16:50:09 +11:00
tevent_add_timer ( ctdb - > ev , m , timeval_zero ( ) ,
ctdb_local_message_trigger , m ) ;
2007-06-07 22:06:19 +10:00
return 0 ;
}
/*
send a ctdb message
*/
2007-09-04 10:45:41 +10:00
int ctdb_daemon_send_message ( struct ctdb_context * ctdb , uint32_t pnn ,
2007-06-07 22:06:19 +10:00
uint64_t srvid , TDB_DATA data )
{
2015-10-29 16:36:30 +11:00
struct ctdb_req_message_old * r ;
2007-06-07 22:06:19 +10:00
int len ;
2009-06-30 12:09:28 +10:00
if ( ctdb - > methods = = NULL ) {
2010-10-28 13:38:34 +11:00
DEBUG ( DEBUG_INFO , ( __location__ " Failed to send message. Transport is DOWN \n " ) ) ;
2009-06-30 12:09:28 +10:00
return - 1 ;
}
2007-06-07 22:06:19 +10:00
/* see if this is a message to ourselves */
2007-09-04 10:45:41 +10:00
if ( pnn = = ctdb - > pnn ) {
2007-06-07 22:06:19 +10:00
return ctdb_local_message ( ctdb , srvid , data ) ;
}
2015-10-29 16:36:30 +11:00
len = offsetof ( struct ctdb_req_message_old , data ) + data . dsize ;
2007-06-07 22:06:19 +10:00
r = ctdb_transport_allocate ( ctdb , ctdb , CTDB_REQ_MESSAGE , len ,
2015-10-29 16:36:30 +11:00
struct ctdb_req_message_old ) ;
2007-06-07 22:06:19 +10:00
CTDB_NO_MEMORY ( ctdb , r ) ;
2007-09-04 10:45:41 +10:00
r - > hdr . destnode = pnn ;
2007-06-07 22:06:19 +10:00
r - > srvid = srvid ;
r - > datalen = data . dsize ;
memcpy ( & r - > data [ 0 ] , data . dptr , data . dsize ) ;
ctdb_queue_packet ( ctdb , & r - > hdr ) ;
talloc_free ( r ) ;
return 0 ;
}
2009-10-23 15:24:51 +11:00
struct ctdb_client_notify_list {
struct ctdb_client_notify_list * next , * prev ;
struct ctdb_context * ctdb ;
uint64_t srvid ;
TDB_DATA data ;
} ;
static int ctdb_client_notify_destructor ( struct ctdb_client_notify_list * nl )
{
int ret ;
DEBUG ( DEBUG_ERR , ( " Sending client notify message for srvid:%llu \n " , ( unsigned long long ) nl - > srvid ) ) ;
2024-02-29 15:33:56 +01:00
ret = ctdb_daemon_send_message ( nl - > ctdb ,
CTDB_BROADCAST_CONNECTED ,
nl - > srvid ,
nl - > data ) ;
2009-10-23 15:24:51 +11:00
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR , ( " Failed to send client notify message \n " ) ) ;
}
return 0 ;
}
int32_t ctdb_control_register_notify ( struct ctdb_context * ctdb , uint32_t client_id , TDB_DATA indata )
{
2015-10-28 17:43:20 +11:00
struct ctdb_notify_data_old * notify = ( struct ctdb_notify_data_old * ) indata . dptr ;
2015-03-17 14:30:18 +11:00
struct ctdb_client * client = reqid_find ( ctdb - > idr , client_id , struct ctdb_client ) ;
2009-10-23 15:24:51 +11:00
struct ctdb_client_notify_list * nl ;
2010-03-30 11:57:25 +11:00
DEBUG ( DEBUG_INFO , ( " Register srvid %llu for client %d \n " , ( unsigned long long ) notify - > srvid , client_id ) ) ;
2009-10-23 15:24:51 +11:00
2015-10-28 17:43:20 +11:00
if ( indata . dsize < offsetof ( struct ctdb_notify_data_old , notify_data ) ) {
2009-10-23 15:24:51 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Too little data in control : %d \n " , ( int ) indata . dsize ) ) ;
return - 1 ;
}
2015-10-28 17:43:20 +11:00
if ( indata . dsize ! = ( notify - > len + offsetof ( struct ctdb_notify_data_old , notify_data ) ) ) {
DEBUG ( DEBUG_ERR , ( __location__ " Wrong amount of data in control. Got %d, expected %d \n " , ( int ) indata . dsize , ( int ) ( notify - > len + offsetof ( struct ctdb_notify_data_old , notify_data ) ) ) ) ;
2009-10-23 15:24:51 +11:00
return - 1 ;
}
if ( client = = NULL ) {
DEBUG ( DEBUG_ERR , ( __location__ " Could not find client parent structure. You can not send this control to a remote node \n " ) ) ;
return - 1 ;
}
for ( nl = client - > notify ; nl ; nl = nl - > next ) {
if ( nl - > srvid = = notify - > srvid ) {
break ;
}
}
if ( nl ! = NULL ) {
DEBUG ( DEBUG_ERR , ( __location__ " Notification for srvid:%llu already exists for this client \n " , ( unsigned long long ) notify - > srvid ) ) ;
return - 1 ;
}
nl = talloc ( client , struct ctdb_client_notify_list ) ;
CTDB_NO_MEMORY ( ctdb , nl ) ;
nl - > ctdb = ctdb ;
nl - > srvid = notify - > srvid ;
nl - > data . dsize = notify - > len ;
2016-04-04 16:23:09 +02:00
nl - > data . dptr = talloc_memdup ( nl , notify - > notify_data ,
nl - > data . dsize ) ;
2009-10-23 15:24:51 +11:00
CTDB_NO_MEMORY ( ctdb , nl - > data . dptr ) ;
2023-03-22 09:36:23 +01:00
2009-10-23 15:24:51 +11:00
DLIST_ADD ( client - > notify , nl ) ;
talloc_set_destructor ( nl , ctdb_client_notify_destructor ) ;
return 0 ;
}
int32_t ctdb_control_deregister_notify ( struct ctdb_context * ctdb , uint32_t client_id , TDB_DATA indata )
{
2015-10-28 17:47:03 +11:00
uint64_t srvid = * ( uint64_t * ) indata . dptr ;
2015-03-17 14:30:18 +11:00
struct ctdb_client * client = reqid_find ( ctdb - > idr , client_id , struct ctdb_client ) ;
2009-10-23 15:24:51 +11:00
struct ctdb_client_notify_list * nl ;
2015-10-28 17:47:03 +11:00
DEBUG ( DEBUG_INFO , ( " Deregister srvid %llu for client %d \n " , ( unsigned long long ) srvid , client_id ) ) ;
2009-10-23 15:24:51 +11:00
if ( client = = NULL ) {
DEBUG ( DEBUG_ERR , ( __location__ " Could not find client parent structure. You can not send this control to a remote node \n " ) ) ;
return - 1 ;
}
for ( nl = client - > notify ; nl ; nl = nl - > next ) {
2015-10-28 17:47:03 +11:00
if ( nl - > srvid = = srvid ) {
2009-10-23 15:24:51 +11:00
break ;
}
}
if ( nl = = NULL ) {
2015-10-28 17:47:03 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " No notification for srvid:%llu found for this client \n " , ( unsigned long long ) srvid ) ) ;
2009-10-23 15:24:51 +11:00
return - 1 ;
}
DLIST_REMOVE ( client - > notify , nl ) ;
talloc_set_destructor ( nl , NULL ) ;
talloc_free ( nl ) ;
return 0 ;
}
2009-12-02 13:17:12 +11:00
2009-12-02 13:58:27 +11:00
struct ctdb_client * ctdb_find_client_by_pid ( struct ctdb_context * ctdb , pid_t pid )
{
struct ctdb_client_pid_list * client_pid ;
for ( client_pid = ctdb - > client_pids ; client_pid ; client_pid = client_pid - > next ) {
if ( client_pid - > pid = = pid ) {
return client_pid - > client ;
}
}
return NULL ;
}
/* This control is used by samba when probing if a process (of a samba daemon)
exists on the node .
Samba does this when it needs / wants to check if a subrecord in one of the
2017-08-29 10:38:14 +02:00
databases is still valid , or if it is stale and can be removed .
2009-12-02 13:58:27 +11:00
If the node is in unhealthy or stopped state we just kill of the samba
2017-08-23 18:11:32 +02:00
process holding this sub - record and return to the calling samba that
2009-12-02 13:58:27 +11:00
the process does not exist .
This allows us to forcefully recall subrecords registered by samba processes
on banned and stopped nodes .
*/
int32_t ctdb_control_process_exists ( struct ctdb_context * ctdb , pid_t pid )
{
struct ctdb_client * client ;
2017-08-25 15:00:59 +10:00
client = ctdb_find_client_by_pid ( ctdb , pid ) ;
if ( client = = NULL ) {
return - 1 ;
}
if ( ctdb - > nodes [ ctdb - > pnn ] - > flags & NODE_FLAGS_INACTIVE ) {
DEBUG ( DEBUG_NOTICE ,
( " Killing client with pid:%d on banned/stopped node \n " ,
( int ) pid ) ) ;
talloc_free ( client ) ;
2009-12-02 13:58:27 +11:00
return - 1 ;
}
return kill ( pid , 0 ) ;
}
2013-06-19 10:58:14 +10:00
2017-08-30 16:18:02 +10:00
int32_t ctdb_control_check_pid_srvid ( struct ctdb_context * ctdb ,
TDB_DATA indata )
{
2017-09-22 13:52:09 +10:00
struct ctdb_client_pid_list * client_pid ;
2017-08-30 16:18:02 +10:00
pid_t pid ;
uint64_t srvid ;
int ret ;
pid = * ( pid_t * ) indata . dptr ;
srvid = * ( uint64_t * ) ( indata . dptr + sizeof ( pid_t ) ) ;
2017-09-22 13:52:09 +10:00
for ( client_pid = ctdb - > client_pids ;
client_pid ! = NULL ;
client_pid = client_pid - > next ) {
if ( client_pid - > pid = = pid ) {
ret = srvid_exists ( ctdb - > srv , srvid ,
client_pid - > client ) ;
if ( ret = = 0 ) {
return 0 ;
}
}
2017-08-30 16:18:02 +10:00
}
2017-09-22 13:52:09 +10:00
return - 1 ;
2017-08-30 16:18:02 +10:00
}
2015-02-20 21:19:01 +11:00
int ctdb_control_getnodesfile ( struct ctdb_context * ctdb , uint32_t opcode , TDB_DATA indata , TDB_DATA * outdata )
{
2015-10-29 17:22:48 +11:00
struct ctdb_node_map_old * node_map = NULL ;
2015-02-20 21:19:01 +11:00
CHECK_CONTROL_DATA_SIZE ( 0 ) ;
node_map = ctdb_read_nodes_file ( ctdb , ctdb - > nodes_file ) ;
if ( node_map = = NULL ) {
DEBUG ( DEBUG_ERR , ( " Failed to read nodes file \n " ) ) ;
return - 1 ;
}
outdata - > dptr = ( unsigned char * ) node_map ;
outdata - > dsize = talloc_get_size ( outdata - > dptr ) ;
return 0 ;
}
2013-06-19 10:58:14 +10:00
void ctdb_shutdown_sequence ( struct ctdb_context * ctdb , int exit_code )
{
2013-06-22 15:44:28 +10:00
if ( ctdb - > runstate = = CTDB_RUNSTATE_SHUTDOWN ) {
DEBUG ( DEBUG_NOTICE , ( " Already shutting down so will not proceed. \n " ) ) ;
return ;
}
2017-07-04 15:49:54 +10:00
DEBUG ( DEBUG_ERR , ( " Shutdown sequence commencing. \n " ) ) ;
2013-06-19 10:58:14 +10:00
ctdb_set_runstate ( ctdb , CTDB_RUNSTATE_SHUTDOWN ) ;
ctdb_stop_recoverd ( ctdb ) ;
ctdb_stop_keepalive ( ctdb ) ;
2017-09-18 16:36:32 +10:00
ctdb_stop_monitoring ( ctdb ) ;
2013-06-19 10:58:14 +10:00
ctdb_event_script ( ctdb , CTDB_EVENT_SHUTDOWN ) ;
2016-09-16 20:06:07 +10:00
ctdb_stop_eventd ( ctdb ) ;
2016-06-27 18:00:49 +10:00
if ( ctdb - > methods ! = NULL & & ctdb - > methods - > shutdown ! = NULL ) {
2013-06-19 10:58:14 +10:00
ctdb - > methods - > shutdown ( ctdb ) ;
}
2017-07-04 15:49:54 +10:00
DEBUG ( DEBUG_ERR , ( " Shutdown sequence complete, exiting. \n " ) ) ;
2013-06-19 10:58:14 +10:00
exit ( exit_code ) ;
}
2015-11-11 14:18:51 +11:00
/* When forking the main daemon and the child process needs to connect
* back to the daemon as a client process , this function can be used
* to change the ctdb context from daemon into client mode . The child
* process must be created using ctdb_fork ( ) and not fork ( ) -
* ctdb_fork ( ) does some necessary housekeeping .
*/
2016-11-25 14:44:10 +11:00
int switch_from_server_to_client ( struct ctdb_context * ctdb )
2015-11-11 14:18:51 +11:00
{
int ret ;
2020-05-19 17:57:35 +10:00
if ( ctdb - > daemon . sd ! = - 1 ) {
close ( ctdb - > daemon . sd ) ;
ctdb - > daemon . sd = - 1 ;
}
2015-11-11 14:18:51 +11:00
/* get a new event context */
ctdb - > ev = tevent_context_init ( ctdb ) ;
2016-07-27 11:45:49 +10:00
if ( ctdb - > ev = = NULL ) {
DEBUG ( DEBUG_ALERT , ( " tevent_context_init() failed \n " ) ) ;
exit ( 1 ) ;
}
2015-11-11 14:18:51 +11:00
tevent_loop_allow_nesting ( ctdb - > ev ) ;
/* Connect to main CTDB daemon */
ret = ctdb_socket_connect ( ctdb ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ALERT , ( __location__ " Failed to init ctdb client \n " ) ) ;
return - 1 ;
}
ctdb - > can_send_controls = true ;
return 0 ;
}