2000-06-10 14:29:31 +00:00
/*
2002-01-30 06:08:46 +00:00
Unix SMB / CIFS implementation .
2000-06-10 14:29:31 +00:00
kernel oplock processing for Linux
Copyright ( C ) Andrew Tridgell 2000
This program is free software ; you can redistribute it and / or modify
it under the terms of the GNU General Public License as published by
2007-07-09 19:25:36 +00:00
the Free Software Foundation ; either version 3 of the License , or
2000-06-10 14:29:31 +00:00
( at your option ) any later version .
This program is distributed in the hope that it will be useful ,
but WITHOUT ANY WARRANTY ; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
GNU General Public License for more details .
You should have received a copy of the GNU General Public License
2007-07-10 00:52:41 +00:00
along with this program . If not , see < http : //www.gnu.org/licenses/>.
2000-06-10 14:29:31 +00:00
*/
2006-05-05 02:06:37 +00:00
# define DBGC_CLASS DBGC_LOCKING
2000-06-10 14:29:31 +00:00
# include "includes.h"
2000-06-11 05:57:58 +00:00
# if HAVE_KERNEL_OPLOCKS_LINUX
2005-04-06 16:28:04 +00:00
/* these can be removed when they are in glibc headers */
struct cap_user_header {
uint32 version ;
int pid ;
} header ;
struct cap_user_data {
uint32 effective ;
uint32 permitted ;
uint32 inheritable ;
} data ;
extern int capget ( struct cap_user_header * hdrp ,
struct cap_user_data * datap ) ;
extern int capset ( struct cap_user_header * hdrp ,
const struct cap_user_data * datap ) ;
2002-07-15 10:35:28 +00:00
static SIG_ATOMIC_T signals_received ;
# define FD_PENDING_SIZE 100
static SIG_ATOMIC_T fd_pending_array [ FD_PENDING_SIZE ] ;
2000-06-10 14:29:31 +00:00
2000-06-11 06:24:54 +00:00
# ifndef F_SETLEASE
# define F_SETLEASE 1024
# endif
# ifndef F_GETLEASE
# define F_GETLEASE 1025
# endif
# ifndef CAP_LEASE
# define CAP_LEASE 28
# endif
2000-06-11 05:57:58 +00:00
totally rewrote the async signal, notification and oplock notification
handling in Samba. This was needed due to several limitations and
races in the previous code - as a side effect the new code is much
cleaner :)
in summary:
- changed sys_select() to avoid a signal/select race condition. It is a
rare race but once we have signals doing notification and oplocks it
is important.
- changed our main processing loop to take advantage of the new
sys_select semantics
- split the notify code into implementaion dependent and general
parts. Added the following structure that defines an implementation:
struct cnotify_fns {
void * (*register_notify)(connection_struct *conn, char *path, uint32 flags);
BOOL (*check_notify)(connection_struct *conn, uint16 vuid, char *path, uint32 flags, void *data, time_t t);
void (*remove_notify)(void *data);
};
then I wrote two implementations, one using hash/poll (like our old
code) and the other using the new Linux kernel change notify. It
should be easy to add other change notify implementations by creating
a sructure of the above type.
- fixed a bug in change notify where we were returning the wrong error
code.
- rewrote the core change notify code to be much simpler
- moved to real-time signals for leases and change notify
Amazingly, it all seems to work. I was very surprised!
(This used to be commit 44766c39e0027c762bee8b33b12c621c109a3267)
2000-06-12 15:53:31 +00:00
# ifndef RT_SIGNAL_LEASE
2003-03-28 01:07:05 +00:00
# define RT_SIGNAL_LEASE (SIGRTMIN+1)
totally rewrote the async signal, notification and oplock notification
handling in Samba. This was needed due to several limitations and
races in the previous code - as a side effect the new code is much
cleaner :)
in summary:
- changed sys_select() to avoid a signal/select race condition. It is a
rare race but once we have signals doing notification and oplocks it
is important.
- changed our main processing loop to take advantage of the new
sys_select semantics
- split the notify code into implementaion dependent and general
parts. Added the following structure that defines an implementation:
struct cnotify_fns {
void * (*register_notify)(connection_struct *conn, char *path, uint32 flags);
BOOL (*check_notify)(connection_struct *conn, uint16 vuid, char *path, uint32 flags, void *data, time_t t);
void (*remove_notify)(void *data);
};
then I wrote two implementations, one using hash/poll (like our old
code) and the other using the new Linux kernel change notify. It
should be easy to add other change notify implementations by creating
a sructure of the above type.
- fixed a bug in change notify where we were returning the wrong error
code.
- rewrote the core change notify code to be much simpler
- moved to real-time signals for leases and change notify
Amazingly, it all seems to work. I was very surprised!
(This used to be commit 44766c39e0027c762bee8b33b12c621c109a3267)
2000-06-12 15:53:31 +00:00
# endif
2000-06-12 17:06:00 +00:00
# ifndef F_SETSIG
# define F_SETSIG 10
# endif
2000-06-10 14:29:31 +00:00
/****************************************************************************
2001-10-20 21:59:34 +00:00
Handle a LEASE signal , incrementing the signals_received and blocking the signal .
2000-06-10 14:29:31 +00:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
2001-10-20 21:59:34 +00:00
2001-05-08 06:14:08 +00:00
static void signal_handler ( int sig , siginfo_t * info , void * unused )
2000-06-10 14:29:31 +00:00
{
2002-07-15 10:35:28 +00:00
if ( signals_received < FD_PENDING_SIZE - 1 ) {
fd_pending_array [ signals_received ] = ( SIG_ATOMIC_T ) info - > si_fd ;
signals_received + + ;
} /* Else signal is lost. */
2005-06-09 15:20:11 +00:00
sys_select_signal ( RT_SIGNAL_LEASE ) ;
2000-06-10 14:29:31 +00:00
}
2000-06-11 05:57:58 +00:00
/****************************************************************************
2001-10-20 21:59:34 +00:00
Try to gain a linux capability .
2001-09-08 02:59:23 +00:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
2001-10-20 21:59:34 +00:00
2001-09-08 02:59:23 +00:00
static void set_capability ( unsigned capability )
2000-06-11 05:57:58 +00:00
{
2000-06-11 06:24:54 +00:00
# ifndef _LINUX_CAPABILITY_VERSION
# define _LINUX_CAPABILITY_VERSION 0x19980330
# endif
header . version = _LINUX_CAPABILITY_VERSION ;
header . pid = 0 ;
if ( capget ( & header , & data ) = = - 1 ) {
2006-08-28 18:25:55 +00:00
DEBUG ( 3 , ( " Unable to get kernel capabilities (%s) \n " ,
strerror ( errno ) ) ) ;
2000-06-11 05:57:58 +00:00
return ;
}
2000-06-11 06:24:54 +00:00
data . effective | = ( 1 < < capability ) ;
if ( capset ( & header , & data ) = = - 1 ) {
DEBUG ( 3 , ( " Unable to set %d capability (%s) \n " ,
capability , strerror ( errno ) ) ) ;
2000-06-11 05:57:58 +00:00
}
}
2007-02-14 02:37:14 +00:00
/*
Call to set the kernel lease signal handler
*/
int linux_set_lease_sighandler ( int fd )
{
if ( fcntl ( fd , F_SETSIG , RT_SIGNAL_LEASE ) = = - 1 ) {
DEBUG ( 3 , ( " Failed to set signal handler for kernel lease \n " ) ) ;
return - 1 ;
}
return 0 ;
}
2000-06-11 05:57:58 +00:00
/****************************************************************************
2006-01-06 10:27:12 +00:00
Call SETLEASE . If we get EACCES then we try setting up the right capability and
2007-02-14 02:37:14 +00:00
try again .
Use the SMB_VFS_LINUX_SETLEASE instead of this call directly .
2000-06-11 05:57:58 +00:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
2001-10-20 21:59:34 +00:00
2007-02-14 02:37:14 +00:00
int linux_setlease ( int fd , int leasetype )
2000-06-11 05:57:58 +00:00
{
int ret ;
2000-06-12 17:06:00 +00:00
2006-01-06 10:27:12 +00:00
ret = fcntl ( fd , F_SETLEASE , leasetype ) ;
2000-06-11 05:57:58 +00:00
if ( ret = = - 1 & & errno = = EACCES ) {
2000-06-11 06:24:54 +00:00
set_capability ( CAP_LEASE ) ;
2000-06-11 05:57:58 +00:00
ret = fcntl ( fd , F_SETLEASE , leasetype ) ;
}
return ret ;
}
2000-06-10 14:29:31 +00:00
/****************************************************************************
* Deal with the Linux kernel < - - > smbd
* oplock break protocol .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
2001-10-20 21:59:34 +00:00
2005-09-30 17:13:37 +00:00
static files_struct * linux_oplock_receive_message ( fd_set * fds )
2000-06-10 14:29:31 +00:00
{
2002-07-15 10:35:28 +00:00
int fd ;
2005-09-30 17:13:37 +00:00
files_struct * fsp ;
2000-06-10 14:29:31 +00:00
2002-07-15 10:35:28 +00:00
BlockSignals ( True , RT_SIGNAL_LEASE ) ;
fd = fd_pending_array [ 0 ] ;
fsp = file_find_fd ( fd ) ;
fd_pending_array [ 0 ] = ( SIG_ATOMIC_T ) - 1 ;
if ( signals_received > 1 )
2005-03-31 05:06:04 +00:00
memmove ( CONST_DISCARD ( void * , & fd_pending_array [ 0 ] ) ,
CONST_DISCARD ( void * , & fd_pending_array [ 1 ] ) ,
2002-07-15 10:35:28 +00:00
sizeof ( SIG_ATOMIC_T ) * ( signals_received - 1 ) ) ;
signals_received - - ;
/* now we can receive more signals */
BlockSignals ( False , RT_SIGNAL_LEASE ) ;
2000-06-10 14:29:31 +00:00
2005-09-30 17:13:37 +00:00
return fsp ;
2000-06-10 14:29:31 +00:00
}
/****************************************************************************
Attempt to set an kernel oplock on a file .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
2001-10-20 21:59:34 +00:00
2000-06-10 14:29:31 +00:00
static BOOL linux_set_kernel_oplock ( files_struct * fsp , int oplock_type )
{
2007-02-14 02:37:14 +00:00
if ( SMB_VFS_LINUX_SETLEASE ( fsp , fsp - > fh - > fd , F_WRLCK ) = = - 1 ) {
2006-08-28 18:25:55 +00:00
DEBUG ( 3 , ( " linux_set_kernel_oplock: Refused oplock on file %s, "
2007-05-29 09:30:34 +00:00
" fd = %d, file_id = %s. (%s) \n " ,
2005-07-08 04:51:27 +00:00
fsp - > fsp_name , fsp - > fh - > fd ,
2007-09-10 10:56:07 +00:00
file_id_string_tos ( & fsp - > file_id ) ,
2006-08-28 18:25:55 +00:00
strerror ( errno ) ) ) ;
2000-06-10 14:29:31 +00:00
return False ;
}
2006-08-28 18:25:55 +00:00
DEBUG ( 3 , ( " linux_set_kernel_oplock: got kernel oplock on file %s, "
2007-05-29 09:30:34 +00:00
" file_id = %s gen_id = %lu \n " ,
2007-09-10 10:56:07 +00:00
fsp - > fsp_name , file_id_string_tos ( & fsp - > file_id ) ,
2007-05-29 09:30:34 +00:00
fsp - > fh - > gen_id ) ) ;
2000-06-10 14:29:31 +00:00
return True ;
}
/****************************************************************************
Release a kernel oplock on a file .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
2001-10-20 21:59:34 +00:00
2000-06-10 14:29:31 +00:00
static void linux_release_kernel_oplock ( files_struct * fsp )
{
if ( DEBUGLVL ( 10 ) ) {
/*
* Check and print out the current kernel
* oplock state of this file .
*/
2005-07-08 04:51:27 +00:00
int state = fcntl ( fsp - > fh - > fd , F_GETLEASE , 0 ) ;
2007-05-29 09:30:34 +00:00
dbgtext ( " linux_release_kernel_oplock: file %s, file_id = %s "
" gen_id = %lu has kernel oplock state "
2007-09-10 10:56:07 +00:00
" of %x. \n " , fsp - > fsp_name , file_id_string_tos ( & fsp - > file_id ) ,
2007-05-29 09:30:34 +00:00
fsp - > fh - > gen_id , state ) ;
2000-06-10 14:29:31 +00:00
}
/*
* Remove the kernel oplock on this file .
*/
2007-02-14 02:37:14 +00:00
if ( SMB_VFS_LINUX_SETLEASE ( fsp , fsp - > fh - > fd , F_UNLCK ) = = - 1 ) {
2000-06-10 14:29:31 +00:00
if ( DEBUGLVL ( 0 ) ) {
2006-08-28 18:25:55 +00:00
dbgtext ( " linux_release_kernel_oplock: Error when "
" removing kernel oplock on file " ) ;
2007-05-29 09:30:34 +00:00
dbgtext ( " %s, file_id = %s, gen_id = %lu. "
2006-08-28 18:25:55 +00:00
" Error was %s \n " , fsp - > fsp_name ,
2007-09-10 10:56:07 +00:00
file_id_string_tos ( & fsp - > file_id ) ,
2007-05-29 09:30:34 +00:00
fsp - > fh - > gen_id , strerror ( errno ) ) ;
2000-06-10 14:29:31 +00:00
}
}
}
/****************************************************************************
2001-10-20 21:59:34 +00:00
See if a oplock message is waiting .
2000-06-10 14:29:31 +00:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
2001-10-20 21:59:34 +00:00
2000-06-10 14:29:31 +00:00
static BOOL linux_oplock_msg_waiting ( fd_set * fds )
{
2002-07-15 10:35:28 +00:00
return signals_received ! = 0 ;
2000-06-10 14:29:31 +00:00
}
2000-06-11 06:46:05 +00:00
/****************************************************************************
2001-10-20 21:59:34 +00:00
See if the kernel supports oplocks .
2000-06-11 06:46:05 +00:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
2001-10-20 21:59:34 +00:00
2000-06-11 06:46:05 +00:00
static BOOL linux_oplocks_available ( void )
{
int fd , ret ;
fd = open ( " /dev/null " , O_RDONLY ) ;
2001-10-20 21:59:34 +00:00
if ( fd = = - 1 )
return False ; /* uggh! */
2000-06-11 06:46:05 +00:00
ret = fcntl ( fd , F_GETLEASE , 0 ) ;
close ( fd ) ;
return ret = = F_UNLCK ;
}
2000-06-10 14:29:31 +00:00
/****************************************************************************
2001-10-20 21:59:34 +00:00
Setup kernel oplocks .
2000-06-10 14:29:31 +00:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
2001-10-20 21:59:34 +00:00
2000-06-10 14:29:31 +00:00
struct kernel_oplocks * linux_init_kernel_oplocks ( void )
{
static struct kernel_oplocks koplocks ;
struct sigaction act ;
2000-06-11 06:46:05 +00:00
if ( ! linux_oplocks_available ( ) ) {
DEBUG ( 3 , ( " Linux kernel oplocks not available \n " ) ) ;
return NULL ;
}
2003-01-14 07:26:12 +00:00
ZERO_STRUCT ( act ) ;
2001-10-20 21:59:34 +00:00
act . sa_handler = NULL ;
act . sa_sigaction = signal_handler ;
act . sa_flags = SA_SIGINFO ;
2003-05-15 17:37:52 +00:00
sigemptyset ( & act . sa_mask ) ;
2001-10-20 21:59:34 +00:00
if ( sigaction ( RT_SIGNAL_LEASE , & act , NULL ) ! = 0 ) {
totally rewrote the async signal, notification and oplock notification
handling in Samba. This was needed due to several limitations and
races in the previous code - as a side effect the new code is much
cleaner :)
in summary:
- changed sys_select() to avoid a signal/select race condition. It is a
rare race but once we have signals doing notification and oplocks it
is important.
- changed our main processing loop to take advantage of the new
sys_select semantics
- split the notify code into implementaion dependent and general
parts. Added the following structure that defines an implementation:
struct cnotify_fns {
void * (*register_notify)(connection_struct *conn, char *path, uint32 flags);
BOOL (*check_notify)(connection_struct *conn, uint16 vuid, char *path, uint32 flags, void *data, time_t t);
void (*remove_notify)(void *data);
};
then I wrote two implementations, one using hash/poll (like our old
code) and the other using the new Linux kernel change notify. It
should be easy to add other change notify implementations by creating
a sructure of the above type.
- fixed a bug in change notify where we were returning the wrong error
code.
- rewrote the core change notify code to be much simpler
- moved to real-time signals for leases and change notify
Amazingly, it all seems to work. I was very surprised!
(This used to be commit 44766c39e0027c762bee8b33b12c621c109a3267)
2000-06-12 15:53:31 +00:00
DEBUG ( 0 , ( " Failed to setup RT_SIGNAL_LEASE handler \n " ) ) ;
2000-06-10 14:29:31 +00:00
return NULL ;
2001-10-20 21:59:34 +00:00
}
2000-06-10 14:29:31 +00:00
koplocks . receive_message = linux_oplock_receive_message ;
koplocks . set_oplock = linux_set_kernel_oplock ;
koplocks . release_oplock = linux_release_kernel_oplock ;
koplocks . msg_waiting = linux_oplock_msg_waiting ;
koplocks . notification_fd = - 1 ;
2003-03-28 01:07:05 +00:00
/* the signal can start off blocked due to a bug in bash */
BlockSignals ( False , RT_SIGNAL_LEASE ) ;
2000-06-12 17:06:00 +00:00
DEBUG ( 3 , ( " Linux kernel oplocks enabled \n " ) ) ;
2000-06-10 14:29:31 +00:00
return & koplocks ;
}
# else
2005-05-02 17:49:43 +00:00
void oplock_linux_dummy ( void ) ;
2000-06-10 14:29:31 +00:00
void oplock_linux_dummy ( void ) { }
# endif /* HAVE_KERNEL_OPLOCKS_LINUX */