2016-02-17 14:32:03 +11:00
/*
CTDB cluster mutex handling
Copyright ( C ) Andrew Tridgell 2007
Copyright ( C ) Ronnie Sahlberg 2007
Copyright ( C ) Martin Schwenke 2016
This program is free software ; you can redistribute it and / or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation ; either version 3 of the License , or
( at your option ) any later version .
This program is distributed in the hope that it will be useful ,
but WITHOUT ANY WARRANTY ; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
GNU General Public License for more details .
You should have received a copy of the GNU General Public License
along with this program ; if not , see < http : //www.gnu.org/licenses/>.
*/
# include "replace.h"
# include "system/network.h"
2019-07-19 11:14:43 +10:00
# include "system/filesys.h"
2016-02-17 14:32:03 +11:00
2018-06-29 15:55:49 +10:00
# include <tevent.h>
2016-02-17 14:32:03 +11:00
# include "lib/util/debug.h"
# include "lib/util/time.h"
# include "lib/util/strv.h"
# include "lib/util/strv_util.h"
2016-11-29 12:55:06 +11:00
# include "lib/util/sys_rw.h"
2016-05-27 13:50:06 +10:00
# include "lib/util/blocking.h"
2016-02-17 14:32:03 +11:00
# include "ctdb_private.h"
# include "ctdb_cluster_mutex.h"
struct ctdb_cluster_mutex_handle {
struct ctdb_context * ctdb ;
cluster_mutex_handler_t handler ;
void * private_data ;
2016-06-01 19:05:47 +10:00
cluster_mutex_lost_handler_t lost_handler ;
void * lost_data ;
2016-02-17 14:32:03 +11:00
int fd [ 2 ] ;
struct tevent_timer * te ;
struct tevent_fd * fde ;
pid_t child ;
struct timeval start_time ;
2016-06-01 18:46:41 +10:00
bool have_response ;
2016-02-17 14:32:03 +11:00
} ;
static void cluster_mutex_timeout ( struct tevent_context * ev ,
struct tevent_timer * te ,
struct timeval t , void * private_data )
{
struct ctdb_cluster_mutex_handle * h =
talloc_get_type ( private_data , struct ctdb_cluster_mutex_handle ) ;
double latency = timeval_elapsed ( & h - > start_time ) ;
if ( h - > handler ! = NULL ) {
2016-06-01 17:10:26 +10:00
h - > handler ( ' 2 ' , latency , h - > private_data ) ;
2016-02-17 14:32:03 +11:00
}
}
/* When the handle is freed it causes any child holding the mutex to
* be killed , thus freeing the mutex */
static int cluster_mutex_destructor ( struct ctdb_cluster_mutex_handle * h )
{
if ( h - > fd [ 0 ] ! = - 1 ) {
h - > fd [ 0 ] = - 1 ;
}
ctdb_kill ( h - > ctdb , h - > child , SIGTERM ) ;
return 0 ;
}
/* this is called when the client process has completed ctdb_recovery_lock()
and has written data back to us through the pipe .
*/
static void cluster_mutex_handler ( struct tevent_context * ev ,
struct tevent_fd * fde ,
uint16_t flags , void * private_data )
{
struct ctdb_cluster_mutex_handle * h =
talloc_get_type ( private_data , struct ctdb_cluster_mutex_handle ) ;
double latency = timeval_elapsed ( & h - > start_time ) ;
char c = ' 0 ' ;
int ret ;
/* Got response from child process so abort timeout */
TALLOC_FREE ( h - > te ) ;
ret = sys_read ( h - > fd [ 0 ] , & c , 1 ) ;
2016-06-01 18:46:41 +10:00
/* Don't call the handler more than once. It only exists to
* process the initial response from the helper . */
if ( h - > have_response ) {
2016-06-01 19:05:47 +10:00
/* Only deal with EOF due to process exit. Silently
* ignore any other output . */
if ( ret = = 0 ) {
if ( h - > lost_handler ! = NULL ) {
h - > lost_handler ( h - > lost_data ) ;
}
}
2016-06-01 18:46:41 +10:00
return ;
}
h - > have_response = true ;
2016-02-17 14:32:03 +11:00
/* If the child wrote status then just pass it to the handler.
* If no status was written then this is an unexpected error
* so pass generic error code to handler . */
if ( h - > handler ! = NULL ) {
2016-06-01 17:10:26 +10:00
h - > handler ( ret = = 1 ? c : ' 3 ' , latency , h - > private_data ) ;
2016-02-17 14:32:03 +11:00
}
}
static char cluster_mutex_helper [ PATH_MAX + 1 ] = " " ;
2019-01-21 12:16:43 +11:00
static bool cluster_mutex_helper_args_file ( TALLOC_CTX * mem_ctx ,
const char * argstring ,
char * * * argv )
2016-02-17 14:32:03 +11:00
{
2019-07-19 11:14:43 +10:00
struct stat st ;
size_t size = sizeof ( cluster_mutex_helper ) ;
const char * t ;
2016-02-17 14:32:03 +11:00
char * * args = NULL ;
2019-07-19 11:14:43 +10:00
int ret ;
if ( cluster_mutex_helper [ 0 ] ! = ' \0 ' ) {
goto helper_done ;
}
t = getenv ( " CTDB_CLUSTER_MUTEX_HELPER " ) ;
if ( t ! = NULL ) {
size_t len ;
len = strlcpy ( cluster_mutex_helper , t , size ) ;
if ( len > = size ) {
DBG_ERR ( " error: CTDB_CLUSTER_MUTEX_HELPER too long \n " ) ;
exit ( 1 ) ;
}
} else {
ret = snprintf ( cluster_mutex_helper ,
size ,
" %s/%s " ,
CTDB_HELPER_BINDIR ,
" ctdb_mutex_fcntl_helper " ) ;
if ( ret < 0 | | ( size_t ) ret > = size ) {
D_ERR ( " Unable to set cluster mutex helper - "
" path too long \n " ) ;
exit ( 1 ) ;
}
}
ret = stat ( cluster_mutex_helper , & st ) ;
if ( ret ! = 0 ) {
D_ERR ( " Unable to set cluster mutex helper \" %s \" - %s \n " ,
cluster_mutex_helper ,
strerror ( errno ) ) ;
exit ( 1 ) ;
}
2016-02-17 14:32:03 +11:00
2019-07-19 11:14:43 +10:00
if ( ( st . st_mode & S_IXUSR ) = = 0 ) {
D_ERR ( " Unable to set cluster_mutex helper \" %s \" - "
" not executable \n " ,
cluster_mutex_helper ) ;
2019-01-21 12:16:43 +11:00
exit ( 1 ) ;
2016-02-17 14:32:03 +11:00
}
2019-07-19 11:14:43 +10:00
D_NOTICE ( " Set cluster mutex helper to \" %s \" \n " , cluster_mutex_helper ) ;
helper_done :
2019-01-21 12:16:43 +11:00
/* Array includes default helper, file and NULL */
args = talloc_array ( mem_ctx , char * , 3 ) ;
if ( args = = NULL ) {
DBG_ERR ( " Memory allocation error \n " ) ;
2016-02-17 14:32:03 +11:00
return false ;
}
2019-01-21 12:16:43 +11:00
args [ 0 ] = cluster_mutex_helper ;
2016-02-17 14:32:03 +11:00
2019-01-21 12:16:43 +11:00
args [ 1 ] = talloc_strdup ( args , argstring ) ;
if ( args [ 1 ] = = NULL ) {
DBG_ERR ( " Memory allocation error \n " ) ;
2016-02-17 14:32:03 +11:00
return false ;
}
2019-01-21 12:16:43 +11:00
args [ 2 ] = NULL ;
* argv = args ;
return true ;
}
2016-02-17 14:32:03 +11:00
2019-01-21 12:16:43 +11:00
static bool cluster_mutex_helper_args_cmd ( TALLOC_CTX * mem_ctx ,
const char * argstring ,
char * * * argv )
{
int i , ret , n ;
char * * args = NULL ;
char * strv = NULL ;
char * t = NULL ;
ret = strv_split ( mem_ctx , & strv , argstring , " \t " ) ;
if ( ret ! = 0 ) {
D_ERR ( " Unable to parse mutex helper command \" %s \" (%s) \n " ,
argstring ,
strerror ( ret ) ) ;
return false ;
2016-02-17 14:32:03 +11:00
}
2019-01-21 12:16:43 +11:00
n = strv_count ( strv ) ;
2019-06-08 06:56:00 +10:00
if ( n = = 0 ) {
D_ERR ( " Mutex helper command is empty \" %s \" \n " , argstring ) ;
return false ;
}
2019-01-21 12:16:43 +11:00
/* Extra slot for NULL */
args = talloc_array ( mem_ctx , char * , n + 1 ) ;
if ( args = = NULL ) {
DBG_ERR ( " Memory allocation error \n " ) ;
return false ;
}
talloc_steal ( args , strv ) ;
2016-02-17 14:32:03 +11:00
t = NULL ;
2019-01-21 12:16:43 +11:00
for ( i = 0 ; i < n ; i + + ) {
2016-02-17 14:32:03 +11:00
t = strv_next ( strv , t ) ;
2019-01-21 12:16:43 +11:00
args [ i ] = t ;
2016-02-17 14:32:03 +11:00
}
2019-01-21 12:16:43 +11:00
args [ n ] = NULL ;
2016-02-17 14:32:03 +11:00
* argv = args ;
return true ;
}
2019-01-21 12:16:43 +11:00
static bool cluster_mutex_helper_args ( TALLOC_CTX * mem_ctx ,
const char * argstring ,
char * * * argv )
{
bool ok ;
if ( argstring ! = NULL & & argstring [ 0 ] = = ' ! ' ) {
ok = cluster_mutex_helper_args_cmd ( mem_ctx , & argstring [ 1 ] , argv ) ;
} else {
ok = cluster_mutex_helper_args_file ( mem_ctx , argstring , argv ) ;
}
return ok ;
}
2016-02-17 14:32:03 +11:00
struct ctdb_cluster_mutex_handle *
2016-05-29 19:27:23 +10:00
ctdb_cluster_mutex ( TALLOC_CTX * mem_ctx ,
struct ctdb_context * ctdb ,
2016-02-17 14:32:03 +11:00
const char * argstring ,
2016-06-01 18:56:33 +10:00
int timeout ,
cluster_mutex_handler_t handler ,
2016-06-01 19:05:47 +10:00
void * private_data ,
cluster_mutex_lost_handler_t lost_handler ,
void * lost_data )
2016-02-17 14:32:03 +11:00
{
struct ctdb_cluster_mutex_handle * h ;
char * * args ;
2018-09-12 17:51:47 +10:00
sigset_t sigset_term ;
2016-02-17 14:32:03 +11:00
int ret ;
2016-05-29 19:27:23 +10:00
h = talloc ( mem_ctx , struct ctdb_cluster_mutex_handle ) ;
2016-02-17 14:32:03 +11:00
if ( h = = NULL ) {
2019-07-05 13:13:16 +10:00
DBG_ERR ( " out of memory \n " ) ;
2016-02-17 14:32:03 +11:00
return NULL ;
}
h - > start_time = timeval_current ( ) ;
h - > fd [ 0 ] = - 1 ;
h - > fd [ 1 ] = - 1 ;
2016-06-01 18:46:41 +10:00
h - > have_response = false ;
2016-02-17 14:32:03 +11:00
ret = pipe ( h - > fd ) ;
if ( ret ! = 0 ) {
talloc_free ( h ) ;
2019-07-05 13:13:16 +10:00
DBG_ERR ( " Failed to open pipe \n " ) ;
2016-02-17 14:32:03 +11:00
return NULL ;
}
set_close_on_exec ( h - > fd [ 0 ] ) ;
/* Create arguments for lock helper */
if ( ! cluster_mutex_helper_args ( h , argstring , & args ) ) {
close ( h - > fd [ 0 ] ) ;
close ( h - > fd [ 1 ] ) ;
talloc_free ( h ) ;
return NULL ;
}
2018-09-12 17:51:47 +10:00
sigemptyset ( & sigset_term ) ;
sigaddset ( & sigset_term , SIGTERM ) ;
ret = sigprocmask ( SIG_BLOCK , & sigset_term , NULL ) ;
if ( ret ! = 0 ) {
DBG_WARNING ( " Failed to block SIGTERM (%d) \n " , errno ) ;
}
2016-02-17 14:32:03 +11:00
h - > child = ctdb_fork ( ctdb ) ;
if ( h - > child = = ( pid_t ) - 1 ) {
close ( h - > fd [ 0 ] ) ;
close ( h - > fd [ 1 ] ) ;
talloc_free ( h ) ;
2018-09-12 17:51:47 +10:00
ret = sigprocmask ( SIG_UNBLOCK , & sigset_term , NULL ) ;
if ( ret ! = 0 ) {
DBG_WARNING ( " Failed to unblock SIGTERM (%d) \n " , errno ) ;
}
2016-02-17 14:32:03 +11:00
return NULL ;
}
if ( h - > child = = 0 ) {
2018-09-12 14:18:00 +10:00
struct sigaction sa = {
. sa_handler = SIG_DFL ,
} ;
ret = sigaction ( SIGTERM , & sa , NULL ) ;
if ( ret ! = 0 ) {
DBG_WARNING ( " Failed to reset signal handler (%d) \n " ,
errno ) ;
}
2018-09-12 17:51:47 +10:00
ret = sigprocmask ( SIG_UNBLOCK , & sigset_term , NULL ) ;
if ( ret ! = 0 ) {
DBG_WARNING ( " Failed to unblock SIGTERM (%d) \n " , errno ) ;
}
2016-02-17 14:32:03 +11:00
/* Make stdout point to the pipe */
close ( STDOUT_FILENO ) ;
dup2 ( h - > fd [ 1 ] , STDOUT_FILENO ) ;
close ( h - > fd [ 1 ] ) ;
execv ( args [ 0 ] , args ) ;
/* Only happens on error */
2019-07-05 13:13:16 +10:00
DBG_ERR ( " execv() failed \n " ) ;
2016-02-17 14:32:03 +11:00
_exit ( 1 ) ;
}
/* Parent */
2018-09-12 17:51:47 +10:00
ret = sigprocmask ( SIG_UNBLOCK , & sigset_term , NULL ) ;
if ( ret ! = 0 ) {
DBG_WARNING ( " Failed to unblock SIGTERM (%d) \n " , errno ) ;
}
2019-07-05 13:13:16 +10:00
DBG_DEBUG ( " Created PIPE FD:%d \n " , h - > fd [ 0 ] ) ;
2016-02-17 14:32:03 +11:00
set_close_on_exec ( h - > fd [ 0 ] ) ;
close ( h - > fd [ 1 ] ) ;
h - > fd [ 1 ] = - 1 ;
talloc_set_destructor ( h , cluster_mutex_destructor ) ;
if ( timeout ! = 0 ) {
h - > te = tevent_add_timer ( ctdb - > ev , h ,
timeval_current_ofs ( timeout , 0 ) ,
cluster_mutex_timeout , h ) ;
} else {
h - > te = NULL ;
}
h - > fde = tevent_add_fd ( ctdb - > ev , h , h - > fd [ 0 ] , TEVENT_FD_READ ,
cluster_mutex_handler , ( void * ) h ) ;
if ( h - > fde = = NULL ) {
talloc_free ( h ) ;
return NULL ;
}
tevent_fd_set_auto_close ( h - > fde ) ;
h - > ctdb = ctdb ;
2016-06-01 18:56:33 +10:00
h - > handler = handler ;
h - > private_data = private_data ;
2016-06-01 19:05:47 +10:00
h - > lost_handler = lost_handler ;
h - > lost_data = lost_data ;
2016-02-17 14:32:03 +11:00
return h ;
}