2007-05-12 15:15:27 +10:00
/*
ctdb freeze handling
Copyright ( C ) Andrew Tridgell 2007
2007-05-31 13:50:53 +10:00
This program is free software ; you can redistribute it and / or modify
it under the terms of the GNU General Public License as published by
2007-07-10 15:29:31 +10:00
the Free Software Foundation ; either version 3 of the License , or
2007-05-31 13:50:53 +10:00
( at your option ) any later version .
This program is distributed in the hope that it will be useful ,
2007-05-12 15:15:27 +10:00
but WITHOUT ANY WARRANTY ; without even the implied warranty of
2007-05-31 13:50:53 +10:00
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
GNU General Public License for more details .
You should have received a copy of the GNU General Public License
2007-07-10 15:29:31 +10:00
along with this program ; if not , see < http : //www.gnu.org/licenses/>.
2007-05-12 15:15:27 +10:00
*/
2015-10-26 16:50:46 +11:00
# include "replace.h"
2007-05-12 15:15:27 +10:00
# include "system/network.h"
# include "system/filesys.h"
# include "system/wait.h"
2015-10-26 16:50:46 +11:00
# include <talloc.h>
# include <tevent.h>
2014-08-15 15:46:33 +10:00
# include "lib/tdb_wrap/tdb_wrap.h"
2015-10-26 16:50:46 +11:00
# include "lib/util/dlinklist.h"
# include "lib/util/debug.h"
# include "ctdb_private.h"
# include "common/rb_tree.h"
2015-10-23 14:17:34 +11:00
# include "common/common.h"
2015-11-11 15:41:10 +11:00
# include "common/logging.h"
2014-08-05 16:23:21 +10:00
/**
* Cancel a transaction on database
*/
static int db_transaction_cancel_handler ( struct ctdb_db_context * ctdb_db ,
void * private_data )
{
int ret ;
tdb_add_flags ( ctdb_db - > ltdb - > tdb , TDB_NOLOCK ) ;
ret = tdb_transaction_cancel ( ctdb_db - > ltdb - > tdb ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR , ( " Failed to cancel transaction for db %s \n " ,
ctdb_db - > db_name ) ) ;
}
tdb_remove_flags ( ctdb_db - > ltdb - > tdb , TDB_NOLOCK ) ;
return 0 ;
}
2014-08-05 17:02:28 +10:00
/**
* Start a transaction on database
*/
static int db_transaction_start_handler ( struct ctdb_db_context * ctdb_db ,
void * private_data )
{
bool freeze_transaction_started = * ( bool * ) private_data ;
int ret ;
tdb_add_flags ( ctdb_db - > ltdb - > tdb , TDB_NOLOCK ) ;
if ( freeze_transaction_started ) {
ret = tdb_transaction_cancel ( ctdb_db - > ltdb - > tdb ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR ,
( " Failed to cancel transaction for db %s \n " ,
ctdb_db - > db_name ) ) ;
}
}
ret = tdb_transaction_start ( ctdb_db - > ltdb - > tdb ) ;
tdb_remove_flags ( ctdb_db - > ltdb - > tdb , TDB_NOLOCK ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR , ( " Failed to start transaction for db %s \n " ,
ctdb_db - > db_name ) ) ;
return - 1 ;
}
return 0 ;
}
2014-08-05 17:13:22 +10:00
/**
* Commit a transaction on database
*/
static int db_transaction_commit_handler ( struct ctdb_db_context * ctdb_db ,
void * private_data )
{
int healthy_nodes = * ( int * ) private_data ;
int ret ;
tdb_add_flags ( ctdb_db - > ltdb - > tdb , TDB_NOLOCK ) ;
ret = tdb_transaction_commit ( ctdb_db - > ltdb - > tdb ) ;
tdb_remove_flags ( ctdb_db - > ltdb - > tdb , TDB_NOLOCK ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR , ( " Failed to commit transaction for db %s \n " ,
ctdb_db - > db_name ) ) ;
return - 1 ;
}
ret = ctdb_update_persistent_health ( ctdb_db - > ctdb , ctdb_db , NULL ,
healthy_nodes ) ;
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR , ( " Failed to update persistent health for db %s \n " ,
ctdb_db - > db_name ) ) ;
}
return ret ;
}
2014-08-05 14:16:29 +10:00
/* a list of control requests waiting for db freeze */
struct ctdb_db_freeze_waiter {
struct ctdb_db_freeze_waiter * next , * prev ;
struct ctdb_context * ctdb ;
void * private_data ;
int32_t status ;
} ;
/* a handle to a db freeze lock child process */
struct ctdb_db_freeze_handle {
struct ctdb_db_context * ctdb_db ;
struct lock_request * lreq ;
struct ctdb_db_freeze_waiter * waiters ;
} ;
/**
* Called when freeing database freeze handle
*/
static int ctdb_db_freeze_handle_destructor ( struct ctdb_db_freeze_handle * h )
{
struct ctdb_db_context * ctdb_db = h - > ctdb_db ;
DEBUG ( DEBUG_ERR , ( " Release freeze handle for db %s \n " ,
ctdb_db - > db_name ) ) ;
/* Cancel any pending transactions */
if ( ctdb_db - > freeze_transaction_started ) {
db_transaction_cancel_handler ( ctdb_db , NULL ) ;
ctdb_db - > freeze_transaction_started = false ;
}
ctdb_db - > freeze_mode = CTDB_FREEZE_NONE ;
ctdb_db - > freeze_handle = NULL ;
talloc_free ( h - > lreq ) ;
return 0 ;
}
/**
* Called when a database is frozen
*/
static void ctdb_db_freeze_handler ( void * private_data , bool locked )
{
struct ctdb_db_freeze_handle * h = talloc_get_type_abort (
private_data , struct ctdb_db_freeze_handle ) ;
struct ctdb_db_freeze_waiter * w ;
if ( h - > ctdb_db - > freeze_mode = = CTDB_FREEZE_FROZEN ) {
DEBUG ( DEBUG_ERR , ( " Freeze db child died - unfreezing \n " ) ) ;
h - > ctdb_db - > freeze_mode = CTDB_FREEZE_NONE ;
talloc_free ( h ) ;
return ;
}
if ( ! locked ) {
DEBUG ( DEBUG_ERR , ( " Failed to get db lock for %s \n " ,
h - > ctdb_db - > db_name ) ) ;
h - > ctdb_db - > freeze_mode = CTDB_FREEZE_NONE ;
talloc_free ( h ) ;
return ;
}
h - > ctdb_db - > freeze_mode = CTDB_FREEZE_FROZEN ;
/* notify the waiters */
while ( ( w = h - > waiters ) ! = NULL ) {
w - > status = 0 ;
DLIST_REMOVE ( h - > waiters , w ) ;
talloc_free ( w ) ;
}
}
/**
* Start freeze process for a database
*/
static void ctdb_start_db_freeze ( struct ctdb_db_context * ctdb_db )
{
struct ctdb_db_freeze_handle * h ;
if ( ctdb_db - > freeze_mode = = CTDB_FREEZE_FROZEN ) {
return ;
}
if ( ctdb_db - > freeze_handle ! = NULL ) {
return ;
}
DEBUG ( DEBUG_ERR , ( " Freeze db: %s \n " , ctdb_db - > db_name ) ) ;
ctdb_stop_vacuuming ( ctdb_db - > ctdb ) ;
h = talloc_zero ( ctdb_db , struct ctdb_db_freeze_handle ) ;
CTDB_NO_MEMORY_FATAL ( ctdb_db - > ctdb , h ) ;
h - > ctdb_db = ctdb_db ;
h - > lreq = ctdb_lock_db ( h , ctdb_db , false , ctdb_db_freeze_handler , h ) ;
CTDB_NO_MEMORY_FATAL ( ctdb_db - > ctdb , h - > lreq ) ;
talloc_set_destructor ( h , ctdb_db_freeze_handle_destructor ) ;
ctdb_db - > freeze_handle = h ;
ctdb_db - > freeze_mode = CTDB_FREEZE_PENDING ;
}
/**
* Reply to a waiter for db freeze
*/
static int ctdb_db_freeze_waiter_destructor ( struct ctdb_db_freeze_waiter * w )
{
/* 'c' pointer is talloc_memdup(), so cannot use talloc_get_type */
2015-10-29 16:42:05 +11:00
struct ctdb_req_control_old * c =
( struct ctdb_req_control_old * ) w - > private_data ;
2014-08-05 14:16:29 +10:00
ctdb_request_control_reply ( w - > ctdb , c , NULL , w - > status , NULL ) ;
return 0 ;
}
/**
* freeze a database
*/
int32_t ctdb_control_db_freeze ( struct ctdb_context * ctdb ,
2015-10-29 16:42:05 +11:00
struct ctdb_req_control_old * c ,
2014-08-05 14:16:29 +10:00
uint32_t db_id ,
bool * async_reply )
{
struct ctdb_db_context * ctdb_db ;
struct ctdb_db_freeze_waiter * w ;
ctdb_db = find_ctdb_db ( ctdb , db_id ) ;
if ( ctdb_db = = NULL ) {
DEBUG ( DEBUG_ERR , ( " Freeze db for unknown dbid 0x%08x \n " , db_id ) ) ;
return - 1 ;
}
if ( ctdb_db - > freeze_mode = = CTDB_FREEZE_FROZEN ) {
DEBUG ( DEBUG_ERR , ( " Freeze db: %s frozen \n " , ctdb_db - > db_name ) ) ;
return 0 ;
}
ctdb_start_db_freeze ( ctdb_db ) ;
/* add ourselves to the list of waiters */
w = talloc ( ctdb_db - > freeze_handle , struct ctdb_db_freeze_waiter ) ;
CTDB_NO_MEMORY ( ctdb , w ) ;
w - > ctdb = ctdb ;
w - > private_data = talloc_steal ( w , c ) ;
w - > status = - 1 ;
talloc_set_destructor ( w , ctdb_db_freeze_waiter_destructor ) ;
DLIST_ADD ( ctdb_db - > freeze_handle - > waiters , w ) ;
* async_reply = true ;
return 0 ;
}
/**
* Thaw a database
*/
int32_t ctdb_control_db_thaw ( struct ctdb_context * ctdb , uint32_t db_id )
{
struct ctdb_db_context * ctdb_db ;
ctdb_db = find_ctdb_db ( ctdb , db_id ) ;
if ( ctdb_db = = NULL ) {
DEBUG ( DEBUG_ERR , ( " Thaw db for unknown dbid 0x%08x \n " , db_id ) ) ;
return - 1 ;
}
2015-09-11 14:20:44 +10:00
DEBUG ( DEBUG_ERR , ( " Thaw db: %s generation %u \n " , ctdb_db - > db_name ,
ctdb_db - > generation ) ) ;
2014-08-05 14:16:29 +10:00
TALLOC_FREE ( ctdb_db - > freeze_handle ) ;
ctdb_call_resend_db ( ctdb_db ) ;
return 0 ;
}
2007-05-12 15:15:27 +10:00
/*
a list of control requests waiting for a freeze lock child to get
the database locks
*/
struct ctdb_freeze_waiter {
struct ctdb_freeze_waiter * next , * prev ;
struct ctdb_context * ctdb ;
2015-10-29 16:42:05 +11:00
struct ctdb_req_control_old * c ;
2009-10-12 12:08:39 +11:00
uint32_t priority ;
2007-05-12 15:15:27 +10:00
int32_t status ;
} ;
/* a handle to a freeze lock child process */
struct ctdb_freeze_handle {
struct ctdb_context * ctdb ;
2009-10-12 12:08:39 +11:00
uint32_t priority ;
2014-08-28 15:28:34 +10:00
unsigned int num_total , num_locked , num_failed ;
2007-05-12 15:15:27 +10:00
struct ctdb_freeze_waiter * waiters ;
} ;
2014-08-28 15:28:34 +10:00
static int db_thaw ( struct ctdb_db_context * ctdb_db , void * private_data )
{
talloc_free ( ctdb_db - > freeze_handle ) ;
return 0 ;
}
2007-05-12 15:15:27 +10:00
/*
destroy a freeze handle
2014-08-05 16:23:21 +10:00
*/
2007-05-12 15:15:27 +10:00
static int ctdb_freeze_handle_destructor ( struct ctdb_freeze_handle * h )
{
2008-07-07 08:50:12 +10:00
struct ctdb_context * ctdb = h - > ctdb ;
2015-09-15 16:13:10 +10:00
DEBUG ( DEBUG_ERR , ( " Release freeze handle for prio %u \n " , h - > priority ) ) ;
2009-10-12 12:08:39 +11:00
2008-07-07 08:50:12 +10:00
/* cancel any pending transactions */
2009-10-12 12:08:39 +11:00
if ( ctdb - > freeze_transaction_started ) {
2014-08-05 16:23:21 +10:00
ctdb_db_prio_iterator ( ctdb , h - > priority ,
db_transaction_cancel_handler , NULL ) ;
2009-10-12 12:08:39 +11:00
ctdb - > freeze_transaction_started = false ;
2008-07-07 08:50:12 +10:00
}
2014-08-28 15:28:34 +10:00
ctdb_db_prio_iterator ( ctdb , h - > priority , db_thaw , NULL ) ;
2009-10-12 12:08:39 +11:00
ctdb - > freeze_mode [ h - > priority ] = CTDB_FREEZE_NONE ;
ctdb - > freeze_handles [ h - > priority ] = NULL ;
2008-07-07 08:50:12 +10:00
2007-05-12 15:15:27 +10:00
return 0 ;
}
/*
called when the child writes its status to us
*/
2012-05-09 15:09:51 +10:00
static void ctdb_freeze_lock_handler ( void * private_data , bool locked )
2007-05-12 15:15:27 +10:00
{
2012-05-09 15:09:51 +10:00
struct ctdb_freeze_handle * h = talloc_get_type_abort ( private_data ,
struct ctdb_freeze_handle ) ;
2007-05-12 15:15:27 +10:00
struct ctdb_freeze_waiter * w ;
2009-10-12 12:08:39 +11:00
if ( h - > ctdb - > freeze_mode [ h - > priority ] = = CTDB_FREEZE_FROZEN ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_INFO , ( " freeze child died - unfreezing \n " ) ) ;
2007-05-12 15:59:49 +10:00
talloc_free ( h ) ;
return ;
}
2012-05-09 15:09:51 +10:00
if ( ! locked ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( " Failed to get locks in ctdb_freeze_child \n " ) ) ;
2007-05-12 15:15:27 +10:00
/* we didn't get the locks - destroy the handle */
talloc_free ( h ) ;
return ;
}
2009-10-12 12:08:39 +11:00
h - > ctdb - > freeze_mode [ h - > priority ] = CTDB_FREEZE_FROZEN ;
2007-05-12 15:15:27 +10:00
/* notify the waiters */
2009-10-22 13:41:28 +11:00
if ( h ! = h - > ctdb - > freeze_handles [ h - > priority ] ) {
DEBUG ( DEBUG_ERR , ( " lockwait finished but h is not linked \n " ) ) ;
}
while ( ( w = h - > waiters ) ) {
2012-05-09 15:09:51 +10:00
w - > status = 0 ;
2009-10-22 13:41:28 +11:00
DLIST_REMOVE ( h - > waiters , w ) ;
2007-05-12 15:15:27 +10:00
talloc_free ( w ) ;
}
}
2014-08-28 15:28:34 +10:00
/**
* When single database is frozen
*/
static int db_freeze_waiter_destructor ( struct ctdb_db_freeze_waiter * w )
{
struct ctdb_freeze_handle * h = talloc_get_type_abort (
w - > private_data , struct ctdb_freeze_handle ) ;
if ( w - > status = = 0 ) {
h - > num_locked + = 1 ;
} else {
h - > num_failed + = 1 ;
}
/* Call ctdb_freeze_lock_handler() only when the status of all
* databases is known .
*/
if ( h - > num_locked + h - > num_failed = = h - > num_total ) {
bool locked ;
if ( h - > num_locked = = h - > num_total ) {
locked = true ;
} else {
locked = false ;
}
ctdb_freeze_lock_handler ( h , locked ) ;
}
return 0 ;
}
/**
* Count the number of databases
*/
static int db_count ( struct ctdb_db_context * ctdb_db , void * private_data )
{
int * count = ( int * ) private_data ;
* count + = 1 ;
return 0 ;
}
/**
* Freeze a single database
*/
static int db_freeze ( struct ctdb_db_context * ctdb_db , void * private_data )
{
struct ctdb_freeze_handle * h = talloc_get_type_abort (
private_data , struct ctdb_freeze_handle ) ;
struct ctdb_db_freeze_waiter * w ;
ctdb_start_db_freeze ( ctdb_db ) ;
w = talloc ( ctdb_db - > freeze_handle , struct ctdb_db_freeze_waiter ) ;
CTDB_NO_MEMORY ( h - > ctdb , w ) ;
w - > ctdb = h - > ctdb ;
w - > private_data = h ;
w - > status = - 1 ;
talloc_set_destructor ( w , db_freeze_waiter_destructor ) ;
if ( ctdb_db - > freeze_mode = = CTDB_FREEZE_FROZEN ) {
/* Early return if already frozen */
w - > status = 0 ;
talloc_free ( w ) ;
return 0 ;
}
DLIST_ADD ( ctdb_db - > freeze_handle - > waiters , w ) ;
return 0 ;
}
2007-05-12 15:15:27 +10:00
/*
2009-10-12 12:08:39 +11:00
start the freeze process for a certain priority
2007-05-12 15:15:27 +10:00
*/
2015-09-16 18:23:23 +10:00
static void ctdb_start_freeze ( struct ctdb_context * ctdb , uint32_t priority )
2007-05-12 15:15:27 +10:00
{
2012-05-09 15:09:51 +10:00
struct ctdb_freeze_handle * h ;
2014-08-28 15:28:34 +10:00
int ret ;
2012-05-09 15:09:51 +10:00
2009-10-12 12:08:39 +11:00
if ( ( priority < 1 ) | | ( priority > NUM_DB_PRIORITIES ) ) {
DEBUG ( DEBUG_ERR , ( __location__ " Invalid db priority : %u \n " , priority ) ) ;
2013-07-01 16:21:00 +10:00
ctdb_fatal ( ctdb , " Internal error " ) ;
2009-10-12 12:08:39 +11:00
}
if ( ctdb - > freeze_mode [ priority ] = = CTDB_FREEZE_FROZEN ) {
2015-09-16 18:49:00 +10:00
int count = 0 ;
/*
* Check if all the databases are frozen
*
* It ' s possible that the databases can get attached after
* initial freeze . This typically happens during startup as
* CTDB will only attach persistent databases and go in to
* startup freeze . The recovery master during recovery will
* attach all the missing databases .
*/
h = ctdb - > freeze_handles [ priority ] ;
if ( h = = NULL ) {
ctdb - > freeze_mode [ priority ] = CTDB_FREEZE_NONE ;
return ;
}
ret = ctdb_db_prio_iterator ( ctdb , priority , db_count , & count ) ;
if ( ret ! = 0 ) {
TALLOC_FREE ( ctdb - > freeze_handles [ priority ] ) ;
ctdb - > freeze_mode [ priority ] = CTDB_FREEZE_NONE ;
return ;
}
if ( count ! = h - > num_total ) {
DEBUG ( DEBUG_ERR , ( " Freeze priority %u: incremental \n " ,
priority ) ) ;
h - > num_total = count ;
h - > num_locked = 0 ;
h - > num_failed = 0 ;
ctdb - > freeze_mode [ priority ] = CTDB_FREEZE_PENDING ;
ret = ctdb_db_prio_iterator ( ctdb , priority ,
db_freeze , h ) ;
if ( ret ! = 0 ) {
TALLOC_FREE ( ctdb - > freeze_handles [ priority ] ) ;
ctdb - > freeze_mode [ priority ] = CTDB_FREEZE_NONE ;
}
}
2013-07-01 16:28:04 +10:00
return ;
2007-05-12 15:15:27 +10:00
}
2014-08-05 15:35:57 +10:00
if ( ctdb - > freeze_handles [ priority ] ! = NULL ) {
/* already trying to freeze */
return ;
}
2013-07-01 13:26:33 +10:00
DEBUG ( DEBUG_ERR , ( " Freeze priority %u \n " , priority ) ) ;
2010-07-21 12:29:55 +09:30
/* Stop any vacuuming going on: we don't want to wait. */
ctdb_stop_vacuuming ( ctdb ) ;
2014-08-28 15:28:34 +10:00
/* create freeze lock children for each database */
2014-08-05 15:35:57 +10:00
h = talloc_zero ( ctdb , struct ctdb_freeze_handle ) ;
CTDB_NO_MEMORY_FATAL ( ctdb , h ) ;
h - > ctdb = ctdb ;
h - > priority = priority ;
talloc_set_destructor ( h , ctdb_freeze_handle_destructor ) ;
2015-09-16 18:49:00 +10:00
ctdb - > freeze_handles [ priority ] = h ;
2014-08-05 15:35:57 +10:00
2014-08-28 15:28:34 +10:00
ret = ctdb_db_prio_iterator ( ctdb , priority , db_count , & h - > num_total ) ;
if ( ret ! = 0 ) {
talloc_free ( h ) ;
return ;
}
2014-08-05 15:35:57 +10:00
ctdb - > freeze_mode [ priority ] = CTDB_FREEZE_PENDING ;
2014-08-28 15:28:34 +10:00
ret = ctdb_db_prio_iterator ( ctdb , priority , db_freeze , h ) ;
if ( ret ! = 0 ) {
talloc_free ( h ) ;
return ;
}
if ( h - > num_total = = 0 ) {
ctdb - > freeze_mode [ priority ] = CTDB_FREEZE_FROZEN ;
}
2007-06-10 08:46:33 +10:00
}
2014-08-28 15:30:39 +10:00
/*
destroy a waiter for a freeze mode change
*/
static int ctdb_freeze_waiter_destructor ( struct ctdb_freeze_waiter * w )
{
ctdb_request_control_reply ( w - > ctdb , w - > c , NULL , w - > status , NULL ) ;
return 0 ;
}
2007-06-10 08:46:33 +10:00
/*
freeze the databases
*/
2015-10-29 16:42:05 +11:00
int32_t ctdb_control_freeze ( struct ctdb_context * ctdb , struct ctdb_req_control_old * c , bool * async_reply )
2007-06-10 08:46:33 +10:00
{
struct ctdb_freeze_waiter * w ;
2009-10-12 09:22:17 +11:00
uint32_t priority ;
priority = ( uint32_t ) c - > srvid ;
2007-06-10 08:46:33 +10:00
2009-10-14 10:14:03 +11:00
if ( priority = = 0 ) {
DEBUG ( DEBUG_ERR , ( " Freeze priority 0 requested, remapping to priority 1 \n " ) ) ;
priority = 1 ;
}
2009-10-12 12:08:39 +11:00
if ( ( priority < 1 ) | | ( priority > NUM_DB_PRIORITIES ) ) {
DEBUG ( DEBUG_ERR , ( __location__ " Invalid db priority : %u \n " , priority ) ) ;
return - 1 ;
}
2015-09-16 18:49:00 +10:00
ctdb_start_freeze ( ctdb , priority ) ;
2009-10-12 12:08:39 +11:00
if ( ctdb - > freeze_mode [ priority ] = = CTDB_FREEZE_FROZEN ) {
2014-08-28 16:58:56 +10:00
DEBUG ( DEBUG_ERR , ( " Freeze priority %u: frozen \n " , priority ) ) ;
2007-06-10 08:46:33 +10:00
/* we're already frozen */
return 0 ;
}
2009-10-22 13:41:28 +11:00
if ( ctdb - > freeze_handles [ priority ] = = NULL ) {
DEBUG ( DEBUG_ERR , ( " No freeze lock handle when adding a waiter \n " ) ) ;
return - 1 ;
}
2014-08-28 15:28:34 +10:00
/* If there are no databases, we are done. */
if ( ctdb - > freeze_handles [ priority ] - > num_total = = 0 ) {
return 0 ;
}
/* add ourselves to list of waiters */
2009-10-12 12:08:39 +11:00
w = talloc ( ctdb - > freeze_handles [ priority ] , struct ctdb_freeze_waiter ) ;
2007-05-12 15:15:27 +10:00
CTDB_NO_MEMORY ( ctdb , w ) ;
2009-10-12 12:08:39 +11:00
w - > ctdb = ctdb ;
w - > c = talloc_steal ( w , c ) ;
w - > priority = priority ;
w - > status = - 1 ;
2007-05-12 15:15:27 +10:00
talloc_set_destructor ( w , ctdb_freeze_waiter_destructor ) ;
2009-10-12 12:08:39 +11:00
DLIST_ADD ( ctdb - > freeze_handles [ priority ] - > waiters , w ) ;
2007-05-12 15:15:27 +10:00
/* we won't reply till later */
2012-05-17 16:08:37 +10:00
* async_reply = true ;
2007-05-12 15:15:27 +10:00
return 0 ;
}
2015-09-17 12:57:51 +10:00
static int db_freeze_block ( struct ctdb_db_context * ctdb_db , void * private_data )
{
struct tevent_context * ev = ( struct tevent_context * ) private_data ;
ctdb_start_db_freeze ( ctdb_db ) ;
while ( ctdb_db - > freeze_mode = = CTDB_FREEZE_PENDING ) {
tevent_loop_once ( ev ) ;
}
if ( ctdb_db - > freeze_mode ! = CTDB_FREEZE_FROZEN ) {
return - 1 ;
}
return 0 ;
}
2007-05-23 12:23:07 +10:00
/*
block until we are frozen , used during daemon startup
*/
bool ctdb_blocking_freeze ( struct ctdb_context * ctdb )
{
2015-09-17 12:57:51 +10:00
int ret ;
2007-05-23 12:23:07 +10:00
2015-09-17 12:57:51 +10:00
ret = ctdb_db_iterator ( ctdb , db_freeze_block , ctdb - > ev ) ;
if ( ret ! = 0 ) {
return false ;
2007-05-23 12:23:07 +10:00
}
2012-06-06 16:19:10 +10:00
return true ;
2007-05-23 12:23:07 +10:00
}
2009-10-12 12:08:39 +11:00
static void thaw_priority ( struct ctdb_context * ctdb , uint32_t priority )
2007-05-12 15:15:27 +10:00
{
2009-10-12 12:08:39 +11:00
DEBUG ( DEBUG_ERR , ( " Thawing priority %u \n " , priority ) ) ;
2009-10-12 09:22:17 +11:00
2008-01-06 12:38:01 +11:00
/* cancel any pending transactions */
2009-10-12 12:08:39 +11:00
if ( ctdb - > freeze_transaction_started ) {
2014-08-05 16:23:21 +10:00
ctdb_db_prio_iterator ( ctdb , priority ,
db_transaction_cancel_handler , NULL ) ;
ctdb - > freeze_transaction_started = false ;
2008-01-06 12:38:01 +11:00
}
2014-08-28 15:28:34 +10:00
ctdb_db_prio_iterator ( ctdb , priority , db_thaw , NULL ) ;
2014-08-28 16:59:52 +10:00
TALLOC_FREE ( ctdb - > freeze_handles [ priority ] ) ;
2009-10-12 12:08:39 +11:00
}
/*
thaw the databases
*/
2014-05-06 14:20:44 +10:00
int32_t ctdb_control_thaw ( struct ctdb_context * ctdb , uint32_t priority ,
bool check_recmode )
2009-10-12 12:08:39 +11:00
{
if ( priority > NUM_DB_PRIORITIES ) {
2014-05-06 14:20:44 +10:00
DEBUG ( DEBUG_ERR , ( __location__ " Invalid db priority : %u \n " ,
priority ) ) ;
return - 1 ;
}
if ( check_recmode & & ctdb - > recovery_mode = = CTDB_RECOVERY_ACTIVE ) {
DEBUG ( DEBUG_ERR , ( " Failing to thaw databases while "
" recovery is active \n " ) ) ;
2009-10-12 12:08:39 +11:00
return - 1 ;
}
if ( priority = = 0 ) {
int i ;
for ( i = 1 ; i < = NUM_DB_PRIORITIES ; i + + ) {
thaw_priority ( ctdb , i ) ;
}
} else {
thaw_priority ( ctdb , priority ) ;
}
2008-01-06 12:38:01 +11:00
2007-05-19 00:56:49 +10:00
ctdb_call_resend_all ( ctdb ) ;
2007-05-12 15:15:27 +10:00
return 0 ;
}
2008-01-06 12:38:01 +11:00
2015-09-09 15:38:36 +10:00
/**
* Database transaction wrappers
*
* These functions are wrappers around transaction start / cancel / commit handlers .
*/
struct db_start_transaction_state {
uint32_t transaction_id ;
bool transaction_started ;
} ;
static int db_start_transaction ( struct ctdb_db_context * ctdb_db ,
void * private_data )
{
struct db_start_transaction_state * state =
( struct db_start_transaction_state * ) private_data ;
int ret ;
bool transaction_started ;
if ( ctdb_db - > freeze_mode ! = CTDB_FREEZE_FROZEN ) {
DEBUG ( DEBUG_ERR ,
( " Database %s not frozen, cannot start transaction \n " ,
ctdb_db - > db_name ) ) ;
return - 1 ;
}
transaction_started = state - > transaction_started &
ctdb_db - > freeze_transaction_started ;
ret = db_transaction_start_handler ( ctdb_db ,
& transaction_started ) ;
if ( ret ! = 0 ) {
return - 1 ;
}
ctdb_db - > freeze_transaction_started = true ;
ctdb_db - > freeze_transaction_id = state - > transaction_id ;
return 0 ;
}
static int db_cancel_transaction ( struct ctdb_db_context * ctdb_db ,
void * private_data )
{
int ret ;
ret = db_transaction_cancel_handler ( ctdb_db , private_data ) ;
if ( ret ! = 0 ) {
return ret ;
}
ctdb_db - > freeze_transaction_started = false ;
return 0 ;
}
struct db_commit_transaction_state {
uint32_t transaction_id ;
int healthy_nodes ;
} ;
static int db_commit_transaction ( struct ctdb_db_context * ctdb_db ,
void * private_data )
{
struct db_commit_transaction_state * state =
( struct db_commit_transaction_state * ) private_data ;
int ret ;
if ( ctdb_db - > freeze_mode ! = CTDB_FREEZE_FROZEN ) {
DEBUG ( DEBUG_ERR ,
( " Database %s not frozen, cannot commit transaction \n " ,
ctdb_db - > db_name ) ) ;
return - 1 ;
}
if ( ! ctdb_db - > freeze_transaction_started ) {
DEBUG ( DEBUG_ERR , ( " Transaction not started on %s \n " ,
ctdb_db - > db_name ) ) ;
return - 1 ;
}
if ( ctdb_db - > freeze_transaction_id ! = state - > transaction_id ) {
DEBUG ( DEBUG_ERR ,
( " Incorrect transaction commit id 0x%08x for %s \n " ,
state - > transaction_id , ctdb_db - > db_name ) ) ;
return - 1 ;
}
ret = db_transaction_commit_handler ( ctdb_db , & state - > healthy_nodes ) ;
if ( ret ! = 0 ) {
return - 1 ;
}
ctdb_db - > freeze_transaction_started = false ;
ctdb_db - > freeze_transaction_id = 0 ;
2015-09-11 14:20:44 +10:00
ctdb_db - > generation = state - > transaction_id ;
2015-09-09 15:38:36 +10:00
return 0 ;
}
/**
* Start a transaction on a database - used for db recovery
*/
int32_t ctdb_control_db_transaction_start ( struct ctdb_context * ctdb ,
TDB_DATA indata )
{
2015-10-28 19:22:23 +11:00
struct ctdb_transdb * w =
( struct ctdb_transdb * ) indata . dptr ;
2015-09-09 15:38:36 +10:00
struct ctdb_db_context * ctdb_db ;
struct db_start_transaction_state state ;
ctdb_db = find_ctdb_db ( ctdb , w - > db_id ) ;
if ( ctdb_db = = NULL ) {
DEBUG ( DEBUG_ERR ,
( " Transaction start for unknown dbid 0x%08x \n " ,
w - > db_id ) ) ;
return - 1 ;
}
2015-10-28 19:22:23 +11:00
state . transaction_id = w - > tid ;
2015-09-09 15:38:36 +10:00
state . transaction_started = true ;
return db_start_transaction ( ctdb_db , & state ) ;
}
/**
* Cancel a transaction on a database - used for db recovery
*/
int32_t ctdb_control_db_transaction_cancel ( struct ctdb_context * ctdb ,
TDB_DATA indata )
{
uint32_t db_id = * ( uint32_t * ) indata . dptr ;
struct ctdb_db_context * ctdb_db ;
ctdb_db = find_ctdb_db ( ctdb , db_id ) ;
if ( ctdb_db = = NULL ) {
DEBUG ( DEBUG_ERR ,
( " Transaction cancel for unknown dbid 0x%08x \n " , db_id ) ) ;
return - 1 ;
}
DEBUG ( DEBUG_ERR , ( " Recovery db transaction cancelled for %s \n " ,
ctdb_db - > db_name ) ) ;
return db_cancel_transaction ( ctdb_db , NULL ) ;
}
/**
* Commit a transaction on a database - used for db recovery
*/
int32_t ctdb_control_db_transaction_commit ( struct ctdb_context * ctdb ,
TDB_DATA indata )
{
2015-10-28 19:22:23 +11:00
struct ctdb_transdb * w =
( struct ctdb_transdb * ) indata . dptr ;
2015-09-09 15:38:36 +10:00
struct ctdb_db_context * ctdb_db ;
struct db_commit_transaction_state state ;
int healthy_nodes , i ;
ctdb_db = find_ctdb_db ( ctdb , w - > db_id ) ;
if ( ctdb_db = = NULL ) {
DEBUG ( DEBUG_ERR ,
( " Transaction commit for unknown dbid 0x%08x \n " ,
w - > db_id ) ) ;
return - 1 ;
}
healthy_nodes = 0 ;
for ( i = 0 ; i < ctdb - > num_nodes ; i + + ) {
if ( ctdb - > nodes [ i ] - > flags = = 0 ) {
healthy_nodes + = 1 ;
}
}
2015-10-28 19:22:23 +11:00
state . transaction_id = w - > tid ;
2015-09-09 15:38:36 +10:00
state . healthy_nodes = healthy_nodes ;
return db_commit_transaction ( ctdb_db , & state ) ;
}
2008-01-06 12:38:01 +11:00
/*
start a transaction on all databases - used for recovery
*/
2008-01-06 13:24:55 +11:00
int32_t ctdb_control_transaction_start ( struct ctdb_context * ctdb , uint32_t id )
2008-01-06 12:38:01 +11:00
{
2015-09-15 15:13:50 +10:00
struct db_start_transaction_state state ;
2014-08-21 12:32:02 +10:00
int ret ;
2008-01-06 12:38:01 +11:00
2014-08-21 12:32:02 +10:00
if ( ! ctdb_db_all_frozen ( ctdb ) ) {
DEBUG ( DEBUG_ERR , ( __location__
" failing transaction start while not frozen \n " ) ) ;
return - 1 ;
2008-01-06 12:38:01 +11:00
}
2015-09-15 15:13:50 +10:00
state . transaction_id = id ;
state . transaction_started = ctdb - > freeze_transaction_started ;
ret = ctdb_db_iterator ( ctdb , db_start_transaction , & state ) ;
2014-08-05 17:02:28 +10:00
if ( ret ! = 0 ) {
return - 1 ;
2008-01-06 12:38:01 +11:00
}
2009-10-12 12:08:39 +11:00
ctdb - > freeze_transaction_started = true ;
ctdb - > freeze_transaction_id = id ;
2008-01-06 12:38:01 +11:00
return 0 ;
}
2009-10-12 16:48:05 +11:00
/*
cancel a transaction for all databases - used for recovery
*/
int32_t ctdb_control_transaction_cancel ( struct ctdb_context * ctdb )
{
DEBUG ( DEBUG_ERR , ( __location__ " recovery transaction cancelled called \n " ) ) ;
2015-09-15 15:13:50 +10:00
ctdb_db_iterator ( ctdb , db_cancel_transaction , NULL ) ;
2009-10-12 16:48:05 +11:00
ctdb - > freeze_transaction_started = false ;
return 0 ;
}
2008-01-06 12:38:01 +11:00
/*
commit transactions on all databases
*/
2008-01-06 13:24:55 +11:00
int32_t ctdb_control_transaction_commit ( struct ctdb_context * ctdb , uint32_t id )
2008-01-06 12:38:01 +11:00
{
2015-09-15 15:13:50 +10:00
struct db_commit_transaction_state state ;
2009-10-12 12:08:39 +11:00
int i ;
2009-12-07 13:28:11 +01:00
int healthy_nodes = 0 ;
2014-08-05 17:13:22 +10:00
int ret ;
2009-12-07 13:28:11 +01:00
2014-08-21 12:32:02 +10:00
if ( ! ctdb_db_all_frozen ( ctdb ) ) {
DEBUG ( DEBUG_ERR , ( __location__
" failing transaction commit while not frozen \n " ) ) ;
return - 1 ;
2008-01-06 12:38:01 +11:00
}
2009-10-12 12:08:39 +11:00
if ( ! ctdb - > freeze_transaction_started ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " transaction not started \n " ) ) ;
2008-01-06 12:38:01 +11:00
return - 1 ;
}
2009-10-12 12:08:39 +11:00
if ( id ! = ctdb - > freeze_transaction_id ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " incorrect transaction id 0x%x in commit \n " , id ) ) ;
2008-01-06 13:24:55 +11:00
return - 1 ;
}
2009-12-07 13:28:11 +01:00
DEBUG ( DEBUG_DEBUG , ( __location__ " num_nodes[%d] \n " , ctdb - > num_nodes ) ) ;
for ( i = 0 ; i < ctdb - > num_nodes ; i + + ) {
DEBUG ( DEBUG_DEBUG , ( __location__ " node[%d].flags[0x%X] \n " ,
i , ctdb - > nodes [ i ] - > flags ) ) ;
if ( ctdb - > nodes [ i ] - > flags = = 0 ) {
healthy_nodes + + ;
}
}
DEBUG ( DEBUG_INFO , ( __location__ " healthy_nodes[%d] \n " , healthy_nodes ) ) ;
2015-09-15 15:13:50 +10:00
state . transaction_id = id ;
state . healthy_nodes = healthy_nodes ;
ret = ctdb_db_iterator ( ctdb , db_commit_transaction , & state ) ;
2014-08-05 17:13:22 +10:00
if ( ret ! = 0 ) {
DEBUG ( DEBUG_ERR , ( " Cancel all transactions \n " ) ) ;
goto fail ;
2008-01-06 12:38:01 +11:00
}
2009-10-12 12:08:39 +11:00
ctdb - > freeze_transaction_started = false ;
ctdb - > freeze_transaction_id = 0 ;
2008-01-06 12:38:01 +11:00
return 0 ;
2009-12-07 13:19:33 +01:00
fail :
/* cancel any pending transactions */
2015-09-15 15:13:50 +10:00
ctdb_db_iterator ( ctdb , db_cancel_transaction , NULL ) ;
2009-12-07 13:19:33 +01:00
ctdb - > freeze_transaction_started = false ;
return - 1 ;
2008-01-06 12:38:01 +11:00
}
/*
wipe a database - only possible when in a frozen transaction
*/
int32_t ctdb_control_wipe_database ( struct ctdb_context * ctdb , TDB_DATA indata )
{
2015-10-28 19:22:23 +11:00
struct ctdb_transdb w = * ( struct ctdb_transdb * ) indata . dptr ;
2008-01-06 12:38:01 +11:00
struct ctdb_db_context * ctdb_db ;
2009-10-12 12:08:39 +11:00
ctdb_db = find_ctdb_db ( ctdb , w . db_id ) ;
if ( ! ctdb_db ) {
DEBUG ( DEBUG_ERR , ( __location__ " Unknown db 0x%x \n " , w . db_id ) ) ;
2008-01-06 12:38:01 +11:00
return - 1 ;
}
2015-09-15 14:16:21 +10:00
if ( ctdb_db - > freeze_mode ! = CTDB_FREEZE_FROZEN ) {
2009-10-12 12:08:39 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Failed transaction_start while not frozen \n " ) ) ;
2008-01-06 12:38:01 +11:00
return - 1 ;
}
2015-09-15 14:16:21 +10:00
if ( ! ctdb_db - > freeze_transaction_started ) {
2009-10-12 12:08:39 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " transaction not started \n " ) ) ;
2008-01-06 13:24:55 +11:00
return - 1 ;
}
2015-10-28 19:22:23 +11:00
if ( w . tid ! = ctdb_db - > freeze_transaction_id ) {
DEBUG ( DEBUG_ERR , ( __location__ " incorrect transaction id 0x%x in commit \n " , w . tid ) ) ;
2008-01-06 12:38:01 +11:00
return - 1 ;
}
if ( tdb_wipe_all ( ctdb_db - > ltdb - > tdb ) ! = 0 ) {
2008-02-04 20:07:15 +11:00
DEBUG ( DEBUG_ERR , ( __location__ " Failed to wipe database for db '%s' \n " ,
2008-01-06 12:38:01 +11:00
ctdb_db - > db_name ) ) ;
return - 1 ;
}
2010-12-17 02:22:02 +01:00
if ( ! ctdb_db - > persistent ) {
talloc_free ( ctdb_db - > delete_queue ) ;
ctdb_db - > delete_queue = trbt_create ( ctdb_db , 0 ) ;
if ( ctdb_db - > delete_queue = = NULL ) {
DEBUG ( DEBUG_ERR , ( __location__ " Failed to re-create "
" the vacuum tree. \n " ) ) ;
return - 1 ;
}
}
2008-01-06 12:38:01 +11:00
return 0 ;
}
2014-08-21 12:26:58 +10:00
2014-08-05 14:16:29 +10:00
bool ctdb_db_frozen ( struct ctdb_db_context * ctdb_db )
{
if ( ctdb_db - > freeze_mode ! = CTDB_FREEZE_FROZEN ) {
return false ;
}
return true ;
}
2014-08-21 12:26:58 +10:00
bool ctdb_db_prio_frozen ( struct ctdb_context * ctdb , uint32_t priority )
{
if ( priority = = 0 ) {
priority = 1 ;
}
if ( priority > NUM_DB_PRIORITIES ) {
DEBUG ( DEBUG_ERR , ( " Invalid DB priority specified \n " ) ) ;
return false ;
}
if ( ctdb - > freeze_mode [ priority ] ! = CTDB_FREEZE_FROZEN ) {
return false ;
}
return true ;
}
bool ctdb_db_all_frozen ( struct ctdb_context * ctdb )
{
int i ;
for ( i = 1 ; i < = NUM_DB_PRIORITIES ; i + + ) {
if ( ctdb - > freeze_mode [ i ] ! = CTDB_FREEZE_FROZEN ) {
return false ;
}
}
return true ;
}