/*
 * Copyright (C) 2002-2004 Sistina Software, Inc. All rights reserved.
 * Copyright (C) 2004-2009 Red Hat, Inc. All rights reserved.
 *
 * This file is part of LVM2.
 *
 * This copyrighted material is made available to anyone wishing to use,
 * modify, copy, or redistribute it subject to the terms and conditions
 * of the GNU Lesser General Public License v.2.1.
 *
 * You should have received a copy of the GNU Lesser General Public License
 * along with this program; if not, write to the Free Software Foundation,
 * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 */
/*
 * Locking functions for LVM.
 * The main purpose of this part of the library is to serialise LVM
 * management operations across a cluster.
 */
# include "lib.h"
# include "clvm.h"
# include "lvm-string.h"
# include "locking.h"
# include "locking_types.h"
2009-06-12 12:30:19 +04:00
# include "toolcontext.h"
2004-06-24 12:02:38 +04:00
2008-11-04 18:07:45 +03:00
# include <assert.h>
2004-06-24 12:02:38 +04:00
# include <stddef.h>
# include <sys/socket.h>
# include <sys/un.h>
# include <unistd.h>
#ifndef CLUSTER_LOCKING_INTERNAL
/*
 * Entry points with external linkage.  They are only declared when
 * CLUSTER_LOCKING_INTERNAL is not defined; in that configuration the
 * definitions further down are non-static and need a prior prototype.
 */
int lock_resource(struct cmd_context *cmd, const char *resource, uint32_t flags);
int query_resource(const char *resource, int *mode);
void locking_end(void);
void reset_locking(void);
int locking_init(int type, struct config_tree *cf, uint32_t *flags);
#endif
/* One unpacked per-node reply from a cluster request. */
typedef struct lvm_response {
	char node[255];		/* Name of the node that sent this reply */
	char *response;		/* Heap copy of the reply text (NUL-terminated) */
	int status;		/* Status code reported by the node; 0 means no error */
	int len;		/* strlen() of response */
} lvm_response_t;
/*
 * Signature value; its bytes 0x43 0x4C 0x56 0x4D are ASCII "CLVM".
 * It is meant to be stuck at the start of memory we allocate so that
 * the block can be sanity-checked at deallocation time.
 * NOTE(review): nothing in the visible part of this file references
 * this macro - confirm whether it is still needed.
 */
# define LVM_SIGNATURE 0x434C564D
/*
 * Socket connected to the cluster daemon (clvmd), or -1 when no
 * connection is open.
 *
 * NOTE: the daemon uses the socket FD as the client ID, which means
 * that any client that calls fork() will inherit the context of
 * its parent.
 */
static int _clvmd_sock = - 1 ;
/* FIXME Install SIGPIPE handler? */
/*
 * Open a stream connection to the cluster manager daemon's local socket.
 *
 * Returns the connected descriptor, or -1 on failure.  When connect()
 * fails the descriptor is closed again and errno is restored to the
 * value connect() left, so the caller sees the real cause.
 */
static int _open_local_sock(void)
{
	struct sockaddr_un addr;
	int connect_errno;
	int fd;

	fd = socket(PF_UNIX, SOCK_STREAM, 0);
	if (fd < 0) {
		log_error("Local socket creation failed: %s", strerror(errno));
		return -1;
	}

	/* sizeof() rather than strlen(): copy the whole CLVMD_SOCKNAME array */
	memset(&addr, 0, sizeof(addr));
	addr.sun_family = AF_UNIX;
	memcpy(addr.sun_path, CLVMD_SOCKNAME, sizeof(CLVMD_SOCKNAME));

	if (!connect(fd, (struct sockaddr *) &addr, sizeof(addr)))
		return fd;

	connect_errno = errno;
	log_error("connect() failed on local socket: %s", strerror(errno));

	if (close(fd))
		stack;

	errno = connect_errno;

	return -1;
}
/* Send a request and return the status */
static int _send_request ( char * inbuf , int inlen , char * * retbuf )
{
2006-12-01 02:11:42 +03:00
char outbuf [ PIPE_BUF ] __attribute ( ( aligned ( 8 ) ) ) ;
2004-06-24 12:02:38 +04:00
struct clvm_header * outheader = ( struct clvm_header * ) outbuf ;
int len ;
int off ;
int buflen ;
int err ;
/* Send it to CLVMD */
rewrite :
if ( ( err = write ( _clvmd_sock , inbuf , inlen ) ) ! = inlen ) {
2008-01-30 17:00:02 +03:00
if ( err = = - 1 & & errno = = EINTR )
goto rewrite ;
2004-06-24 12:02:38 +04:00
log_error ( " Error writing data to clvmd: %s " , strerror ( errno ) ) ;
return 0 ;
}
/* Get the response */
reread :
if ( ( len = read ( _clvmd_sock , outbuf , sizeof ( struct clvm_header ) ) ) < 0 ) {
2008-01-30 17:00:02 +03:00
if ( errno = = EINTR )
goto reread ;
2004-06-24 12:02:38 +04:00
log_error ( " Error reading data from clvmd: %s " , strerror ( errno ) ) ;
return 0 ;
}
if ( len = = 0 ) {
log_error ( " EOF reading CLVMD " ) ;
errno = ENOTCONN ;
return 0 ;
}
/* Allocate buffer */
buflen = len + outheader - > arglen ;
2005-10-17 03:03:59 +04:00
* retbuf = dm_malloc ( buflen ) ;
2004-06-24 12:02:38 +04:00
if ( ! * retbuf ) {
errno = ENOMEM ;
return 0 ;
}
/* Copy the header */
memcpy ( * retbuf , outbuf , len ) ;
outheader = ( struct clvm_header * ) * retbuf ;
/* Read the returned values */
off = 1 ; /* we've already read the first byte */
2005-01-07 17:22:49 +03:00
while ( off < = outheader - > arglen & & len > 0 ) {
2004-06-24 12:02:38 +04:00
len = read ( _clvmd_sock , outheader - > args + off ,
buflen - off - offsetof ( struct clvm_header , args ) ) ;
if ( len > 0 )
off + = len ;
}
/* Was it an error ? */
2005-01-21 14:35:24 +03:00
if ( outheader - > status ! = 0 ) {
errno = outheader - > status ;
/* Only return an error here if there are no node-specific
errors present in the message that might have more detail */
if ( ! ( outheader - > flags & CLVMD_FLAG_NODEERRS ) ) {
log_error ( " cluster request failed: %s " , strerror ( errno ) ) ;
return 0 ;
}
2004-06-24 12:02:38 +04:00
}
return 1 ;
}
/* Build the structure header and parse-out wildcard node names */
2008-12-16 15:30:39 +03:00
/* FIXME: Cleanup implicit casts of clvmd_cmd (int, char, uint8_t, etc). */
static void _build_header ( struct clvm_header * head , int clvmd_cmd , const char * node ,
2004-06-24 12:02:38 +04:00
int len )
{
2008-12-16 15:30:39 +03:00
head - > cmd = clvmd_cmd ;
2004-06-24 12:02:38 +04:00
head - > status = 0 ;
head - > flags = 0 ;
head - > clientid = 0 ;
head - > arglen = len ;
if ( node ) {
/*
* Allow a couple of special node names :
* " * " for all nodes ,
* " . " for the local node only
*/
if ( strcmp ( node , " * " ) = = 0 ) {
head - > node [ 0 ] = ' \0 ' ;
} else if ( strcmp ( node , " . " ) = = 0 ) {
head - > node [ 0 ] = ' \0 ' ;
head - > flags = CLVMD_FLAG_LOCAL ;
} else
strcpy ( head - > node , node ) ;
} else
head - > node [ 0 ] = ' \0 ' ;
}
/*
* Send a message to a ( or all ) node ( s ) in the cluster and wait for replies
*/
2008-12-16 15:30:39 +03:00
static int _cluster_request ( char clvmd_cmd , const char * node , void * data , int len ,
2004-06-24 12:02:38 +04:00
lvm_response_t * * response , int * num )
{
2006-12-01 02:11:42 +03:00
char outbuf [ sizeof ( struct clvm_header ) + len + strlen ( node ) + 1 ] __attribute ( ( aligned ( 8 ) ) ) ;
2004-06-24 12:02:38 +04:00
char * inptr ;
char * retbuf = NULL ;
int status ;
int i ;
int num_responses = 0 ;
struct clvm_header * head = ( struct clvm_header * ) outbuf ;
lvm_response_t * rarray ;
* num = 0 ;
if ( _clvmd_sock = = - 1 )
_clvmd_sock = _open_local_sock ( ) ;
if ( _clvmd_sock = = - 1 )
return 0 ;
2008-12-16 15:30:39 +03:00
_build_header ( head , clvmd_cmd , node , len ) ;
2004-06-24 12:02:38 +04:00
memcpy ( head - > node + strlen ( head - > node ) + 1 , data , len ) ;
status = _send_request ( outbuf , sizeof ( struct clvm_header ) +
strlen ( head - > node ) + len , & retbuf ) ;
if ( ! status )
goto out ;
/* Count the number of responses we got */
head = ( struct clvm_header * ) retbuf ;
inptr = head - > args ;
while ( inptr [ 0 ] ) {
num_responses + + ;
inptr + = strlen ( inptr ) + 1 ;
inptr + = sizeof ( int ) ;
inptr + = strlen ( inptr ) + 1 ;
}
/*
* Allocate response array .
* With an extra pair of INTs on the front to sanity
* check the pointer when we are given it back to free
*/
2006-12-02 02:10:26 +03:00
* response = dm_malloc ( sizeof ( lvm_response_t ) * num_responses ) ;
if ( ! * response ) {
2004-06-24 12:02:38 +04:00
errno = ENOMEM ;
status = 0 ;
goto out ;
}
rarray = * response ;
/* Unpack the response into an lvm_response_t array */
inptr = head - > args ;
i = 0 ;
while ( inptr [ 0 ] ) {
strcpy ( rarray [ i ] . node , inptr ) ;
inptr + = strlen ( inptr ) + 1 ;
2006-06-12 13:46:35 +04:00
memcpy ( & rarray [ i ] . status , inptr , sizeof ( int ) ) ;
2004-06-24 12:02:38 +04:00
inptr + = sizeof ( int ) ;
2005-10-17 03:03:59 +04:00
rarray [ i ] . response = dm_malloc ( strlen ( inptr ) + 1 ) ;
2004-06-24 12:02:38 +04:00
if ( rarray [ i ] . response = = NULL ) {
/* Free up everything else and return error */
int j ;
for ( j = 0 ; j < i ; j + + )
2005-10-17 03:03:59 +04:00
dm_free ( rarray [ i ] . response ) ;
2006-12-02 02:10:26 +03:00
free ( * response ) ;
2004-06-24 12:02:38 +04:00
errno = ENOMEM ;
status = - 1 ;
goto out ;
}
strcpy ( rarray [ i ] . response , inptr ) ;
rarray [ i ] . len = strlen ( inptr ) ;
inptr + = strlen ( inptr ) + 1 ;
i + + ;
}
* num = num_responses ;
* response = rarray ;
out :
if ( retbuf )
2005-10-17 03:03:59 +04:00
dm_free ( retbuf ) ;
2004-06-24 12:02:38 +04:00
return status ;
}
/* Free reply array */
2006-12-02 02:10:26 +03:00
static int _cluster_free_request ( lvm_response_t * response , int num )
2004-06-24 12:02:38 +04:00
{
int i ;
for ( i = 0 ; i < num ; i + + ) {
2005-10-17 03:03:59 +04:00
dm_free ( response [ i ] . response ) ;
2004-06-24 12:02:38 +04:00
}
2006-12-02 02:10:26 +03:00
dm_free ( response ) ;
2004-06-24 12:02:38 +04:00
return 1 ;
}
2009-06-12 12:30:19 +04:00
static int _lock_for_cluster ( struct cmd_context * cmd , unsigned char clvmd_cmd ,
uint32_t flags , const char * name )
2004-06-24 12:02:38 +04:00
{
int status ;
int i ;
char * args ;
const char * node = " " ;
int len ;
2010-03-26 18:40:13 +03:00
int dmeventd_mode ;
2004-06-24 12:02:38 +04:00
int saved_errno = errno ;
lvm_response_t * response = NULL ;
int num_responses ;
assert ( name ) ;
len = strlen ( name ) + 3 ;
args = alloca ( len ) ;
strcpy ( args + 2 , name ) ;
2009-12-09 21:28:27 +03:00
/* Maskoff lock flags */
args [ 0 ] = flags & ( LCK_SCOPE_MASK | LCK_TYPE_MASK | LCK_NONBLOCK | LCK_HOLD ) ;
args [ 1 ] = flags & ( LCK_LOCAL | LCK_CLUSTER_VG ) ;
2004-06-24 12:02:38 +04:00
2006-05-12 17:33:22 +04:00
if ( mirror_in_sync ( ) )
2006-05-11 23:05:21 +04:00
args [ 1 ] | = LCK_MIRROR_NOSYNC_MODE ;
2010-03-26 18:40:13 +03:00
/*
* Must handle tri - state return from dmeventd_monitor_mode .
* But DMEVENTD_MONITOR_IGNORE is not propagated across the cluster .
*/
dmeventd_mode = dmeventd_monitor_mode ( ) ;
if ( dmeventd_mode ! = DMEVENTD_MONITOR_IGNORE & & dmeventd_mode )
2007-01-20 01:21:45 +03:00
args [ 1 ] | = LCK_DMEVENTD_MONITOR_MODE ;
2006-05-12 23:16:48 +04:00
2009-06-12 12:30:19 +04:00
if ( cmd - > partial_activation )
args [ 1 ] | = LCK_PARTIAL_MODE ;
2004-06-24 12:02:38 +04:00
/*
* VG locks are just that : locks , and have no side effects
* so we only need to do them on the local node because all
* locks are cluster - wide .
2005-01-21 14:35:24 +03:00
* Also , if the lock is exclusive it makes no sense to try to
2004-06-24 12:02:38 +04:00
* acquire it on all nodes , so just do that on the local node too .
2008-01-30 17:00:02 +03:00
* One exception , is that P_ locks / do / get distributed across
2007-08-23 19:43:20 +04:00
* the cluster because they might have side - effects .
2004-06-24 12:02:38 +04:00
*/
2007-08-23 19:43:20 +04:00
if ( strncmp ( name , " P_ " , 2 ) & &
2008-12-16 15:30:39 +03:00
( clvmd_cmd = = CLVMD_CMD_LOCK_VG | |
2007-08-23 19:43:20 +04:00
( flags & LCK_TYPE_MASK ) = = LCK_EXCL | |
( flags & LCK_LOCAL ) | |
! ( flags & LCK_CLUSTER_VG ) ) )
2004-06-24 12:02:38 +04:00
node = " . " ;
2008-12-16 15:30:39 +03:00
status = _cluster_request ( clvmd_cmd , node , args , len ,
2004-06-24 12:02:38 +04:00
& response , & num_responses ) ;
/* If any nodes were down then display them and return an error */
for ( i = 0 ; i < num_responses ; i + + ) {
2005-01-21 14:35:24 +03:00
if ( response [ i ] . status = = EHOSTDOWN ) {
2004-06-24 12:02:38 +04:00
log_error ( " clvmd not running on node %s " ,
response [ i ] . node ) ;
status = 0 ;
2005-01-21 14:35:24 +03:00
errno = response [ i ] . status ;
2004-06-24 12:02:38 +04:00
} else if ( response [ i ] . status ) {
log_error ( " Error locking on node %s: %s " ,
response [ i ] . node ,
response [ i ] . response [ 0 ] ?
response [ i ] . response :
strerror ( response [ i ] . status ) ) ;
status = 0 ;
2005-01-21 14:35:24 +03:00
errno = response [ i ] . status ;
2004-06-24 12:02:38 +04:00
}
}
saved_errno = errno ;
2006-12-02 02:10:26 +03:00
_cluster_free_request ( response , num_responses ) ;
2004-06-24 12:02:38 +04:00
errno = saved_errno ;
return status ;
}
/* API entry point for LVM */
# ifdef CLUSTER_LOCKING_INTERNAL
static int _lock_resource ( struct cmd_context * cmd , const char * resource ,
2007-08-22 18:38:18 +04:00
uint32_t flags )
2004-06-24 12:02:38 +04:00
# else
2007-08-22 18:38:18 +04:00
int lock_resource ( struct cmd_context * cmd , const char * resource , uint32_t flags )
2004-06-24 12:02:38 +04:00
# endif
{
char lockname [ PATH_MAX ] ;
2008-12-16 15:30:39 +03:00
int clvmd_cmd = 0 ;
2007-11-17 00:16:20 +03:00
const char * lock_scope ;
const char * lock_type = " " ;
2004-06-24 12:02:38 +04:00
assert ( strlen ( resource ) < sizeof ( lockname ) ) ;
2006-05-10 21:49:25 +04:00
assert ( resource ) ;
2004-06-24 12:02:38 +04:00
switch ( flags & LCK_SCOPE_MASK ) {
case LCK_VG :
2009-04-22 13:39:45 +04:00
if ( flags = = LCK_VG_BACKUP ) {
log_very_verbose ( " Requesting backup of VG metadata for %s " ,
resource ) ;
2009-06-12 12:30:19 +04:00
return _lock_for_cluster ( cmd , CLVMD_CMD_VG_BACKUP ,
2009-04-22 13:39:45 +04:00
LCK_CLUSTER_VG , resource ) ;
}
2004-06-24 12:02:38 +04:00
/* If the VG name is empty then lock the unused PVs */
2010-05-19 06:36:33 +04:00
if ( is_orphan_vg ( resource ) | | is_global_vg ( resource ) | | ( flags & LCK_CACHE ) )
2008-05-09 22:45:15 +04:00
dm_snprintf ( lockname , sizeof ( lockname ) , " P_%s " ,
resource ) ;
2004-06-24 12:02:38 +04:00
else
2006-08-21 16:54:53 +04:00
dm_snprintf ( lockname , sizeof ( lockname ) , " V_%s " ,
2008-05-09 22:45:15 +04:00
resource ) ;
2004-06-24 12:02:38 +04:00
2007-11-17 00:16:20 +03:00
lock_scope = " VG " ;
2008-12-16 15:30:39 +03:00
clvmd_cmd = CLVMD_CMD_LOCK_VG ;
2010-04-13 18:36:24 +04:00
/*
* Old clvmd does not expect LCK_HOLD which was already processed
* in lock_vol , mask it for compatibility reasons .
*/
if ( flags ! = LCK_VG_COMMIT & & flags ! = LCK_VG_REVERT )
flags & = ~ LCK_HOLD ;
2004-06-24 12:02:38 +04:00
break ;
case LCK_LV :
2008-12-16 15:30:39 +03:00
clvmd_cmd = CLVMD_CMD_LOCK_LV ;
2004-06-24 12:02:38 +04:00
strcpy ( lockname , resource ) ;
2007-11-17 00:16:20 +03:00
lock_scope = " LV " ;
2009-12-09 21:16:38 +03:00
flags & = ~ LCK_HOLD ; /* Mask off HOLD flag */
2004-06-24 12:02:38 +04:00
break ;
default :
log_error ( " Unrecognised lock scope: %d " ,
flags & LCK_SCOPE_MASK ) ;
return 0 ;
}
2007-11-17 00:16:20 +03:00
switch ( flags & LCK_TYPE_MASK ) {
case LCK_UNLOCK :
lock_type = " UN " ;
break ;
case LCK_NULL :
lock_type = " NL " ;
break ;
case LCK_READ :
lock_type = " CR " ;
break ;
case LCK_PREAD :
lock_type = " PR " ;
break ;
case LCK_WRITE :
lock_type = " PW " ;
break ;
case LCK_EXCL :
lock_type = " EX " ;
break ;
default :
log_error ( " Unrecognised lock type: %u " ,
flags & LCK_TYPE_MASK ) ;
return 0 ;
}
2010-01-05 19:03:37 +03:00
log_very_verbose ( " Locking %s %s %s (%s%s%s%s%s%s) (0x%x) " , lock_scope , lockname ,
lock_type , lock_scope ,
flags & LCK_NONBLOCK ? " |NONBLOCK " : " " ,
flags & LCK_HOLD ? " |HOLD " : " " ,
flags & LCK_LOCAL ? " |LOCAL " : " " ,
flags & LCK_CLUSTER_VG ? " |CLUSTER " : " " ,
flags & LCK_CACHE ? " |CACHE " : " " ,
2007-11-17 00:16:20 +03:00
flags ) ;
2004-06-24 12:02:38 +04:00
2007-11-17 00:16:20 +03:00
/* Send a message to the cluster manager */
2009-06-12 12:30:19 +04:00
return _lock_for_cluster ( cmd , clvmd_cmd , flags , lockname ) ;
2004-06-24 12:02:38 +04:00
}
2009-05-19 14:38:58 +04:00
/*
 * Map the two-letter lock mode reported by a node to its LCK_* type.
 *
 * Returns LCK_NULL for a NULL response, LCK_EXCL / LCK_READ / LCK_PREAD
 * for "EX" / "CR" / "PR", and 0 (after logging a stack trace) for any
 * other string.
 */
static int decode_lock_type(const char *response)
{
	if (!response)
		return LCK_NULL;

	/* strcmp() returns 0 on a match, so each test must be negated */
	if (!strcmp(response, "EX"))
		return LCK_EXCL;

	if (!strcmp(response, "CR"))
		return LCK_READ;

	if (!strcmp(response, "PR"))
		return LCK_PREAD;

	stack;
	return 0;
}
# ifdef CLUSTER_LOCKING_INTERNAL
2009-05-21 07:04:52 +04:00
static int _query_resource ( const char * resource , int * mode )
2009-05-19 14:38:58 +04:00
# else
2009-05-21 07:04:52 +04:00
int query_resource ( const char * resource , int * mode )
2009-05-19 14:38:58 +04:00
# endif
{
int i , status , len , num_responses , saved_errno ;
const char * node = " " ;
char * args ;
lvm_response_t * response = NULL ;
saved_errno = errno ;
len = strlen ( resource ) + 3 ;
args = alloca ( len ) ;
strcpy ( args + 2 , resource ) ;
args [ 0 ] = 0 ;
args [ 1 ] = LCK_CLUSTER_VG ;
status = _cluster_request ( CLVMD_CMD_LOCK_QUERY , node , args , len ,
& response , & num_responses ) ;
* mode = LCK_NULL ;
for ( i = 0 ; i < num_responses ; i + + ) {
if ( response [ i ] . status = = EHOSTDOWN )
continue ;
if ( ! response [ i ] . response [ 0 ] )
continue ;
/*
* All nodes should use CR , or exactly one node
* should held EX . ( PR is obsolete )
* If two nodes node reports different locks ,
* something is broken - just return more important mode .
*/
if ( decode_lock_type ( response [ i ] . response ) > * mode )
* mode = decode_lock_type ( response [ i ] . response ) ;
log_debug ( " Lock held for %s, node %s : %s " , resource ,
response [ i ] . node , response [ i ] . response ) ;
}
_cluster_free_request ( response , num_responses ) ;
errno = saved_errno ;
return status ;
}
2004-06-24 12:02:38 +04:00
/*
 * Close the connection to clvmd, if one is open, and mark it closed.
 * A close() failure is only traced.
 */
#ifdef CLUSTER_LOCKING_INTERNAL
static void _locking_end(void)
#else
void locking_end(void)
#endif
{
	if (_clvmd_sock != -1) {
		if (close(_clvmd_sock))
			stack;
	}

	_clvmd_sock = -1;
}
/*
 * Drop the current clvmd connection and open a fresh one.
 * Failures are only traced; _clvmd_sock is left at -1 if the new
 * connection cannot be opened.
 */
#ifdef CLUSTER_LOCKING_INTERNAL
static void _reset_locking(void)
#else
void reset_locking(void)
#endif
{
	/* Only close a socket that is open, as the locking_end code does */
	if (_clvmd_sock != -1 && close(_clvmd_sock))
		stack;

	_clvmd_sock = _open_local_sock();
	if (_clvmd_sock == -1)
		stack;
}
# ifdef CLUSTER_LOCKING_INTERNAL
2006-05-16 20:48:31 +04:00
int init_cluster_locking ( struct locking_type * locking , struct cmd_context * cmd )
2004-06-24 12:02:38 +04:00
{
locking - > lock_resource = _lock_resource ;
2009-05-21 07:04:52 +04:00
locking - > query_resource = _query_resource ;
2004-06-24 12:02:38 +04:00
locking - > fin_locking = _locking_end ;
locking - > reset_locking = _reset_locking ;
2005-03-22 01:55:12 +03:00
locking - > flags = LCK_PRE_MEMLOCK | LCK_CLUSTERED ;
2004-06-24 12:02:38 +04:00
_clvmd_sock = _open_local_sock ( ) ;
if ( _clvmd_sock = = - 1 )
return 0 ;
return 1 ;
}
# else
int locking_init ( int type , struct config_tree * cf , uint32_t * flags )
{
_clvmd_sock = _open_local_sock ( ) ;
if ( _clvmd_sock = = - 1 )
return 0 ;
/* Ask LVM to lock memory before calling us */
* flags | = LCK_PRE_MEMLOCK ;
2005-03-22 01:55:12 +03:00
* flags | = LCK_CLUSTERED ;
2004-06-24 12:02:38 +04:00
return 1 ;
}
# endif