/*
 * Simulate the Posix AIO using mmap/fork
 *
 * Copyright (C) Volker Lendecke 2008
 * Copyright (C) Jeremy Allison 2010
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */
# include "includes.h"
2011-03-30 22:24:18 +02:00
# include "system/filesys.h"
2011-02-25 17:03:27 +01:00
# include "system/shmem.h"
2011-03-30 22:24:18 +02:00
# include "smbd/smbd.h"
2012-04-08 21:49:59 +02:00
# include "smbd/globals.h"
2012-07-09 11:10:30 +02:00
# include "lib/async_req/async_sock.h"
# include "lib/util/tevent_unix.h"
2015-10-12 15:57:34 +02:00
# include "lib/util/sys_rw.h"
# include "lib/util/sys_rw_data.h"
2016-05-14 09:45:49 +02:00
# include "lib/util/msghdr.h"
2016-03-28 10:19:49 +03:00
# include "smbprofile.h"
2021-01-03 21:53:49 +01:00
# include "lib/global_contexts.h"
2008-02-21 16:14:08 +01:00
2014-06-14 00:55:02 +02:00
/* Refuse to build when neither way of passing descriptors is available. */
#if !defined(HAVE_STRUCT_MSGHDR_MSG_CONTROL) && !defined(HAVE_STRUCT_MSGHDR_MSG_ACCRIGHTS)
# error Can not pass file descriptors
#endif

/* Drop any macro definition of recvmsg. */
#undef recvmsg

/* Provide a neutral value for MAP_FILE where it is not defined. */
#ifndef MAP_FILE
#define MAP_FILE 0
#endif
2017-12-07 20:53:18 +01:00
struct aio_child_list;

/* Module configuration stored as the VFS handle's private data. */
struct aio_fork_config {
	/* copied into every command sent to a helper child */
	bool erratic_testing_mode;
	/* pool of helper children, allocated on first use */
	struct aio_child_list *children;
};
2008-02-21 16:14:08 +01:00
/* A memory mapping together with its length. */
struct mmap_area {
	size_t size;	/* length handed to mmap() and munmap() */
	void *ptr;	/* start address returned by mmap() */
};
static int mmap_area_destructor ( struct mmap_area * area )
{
2015-04-10 11:10:27 +02:00
munmap ( discard_const ( area - > ptr ) , area - > size ) ;
2008-02-21 16:14:08 +01:00
return 0 ;
}
/*
 * Allocate a struct mmap_area below mem_ctx and back it with "size" bytes
 * obtained from a MAP_SHARED mapping of /dev/zero.
 *
 * A destructor is installed that unmaps the region when the object is freed.
 *
 * Returns the new area, or NULL on failure. On failure errno holds the cause
 * (ENOMEM for a failed talloc, otherwise the errno of open() or mmap()), so
 * callers may rely on it.
 */
static struct mmap_area *mmap_area_init(TALLOC_CTX *mem_ctx, size_t size)
{
	struct mmap_area *result;
	int saved_errno;
	int fd;

	result = talloc(mem_ctx, struct mmap_area);
	if (result == NULL) {
		DEBUG(0, ("talloc failed\n"));
		saved_errno = ENOMEM;
		goto fail;
	}

	fd = open("/dev/zero", O_RDWR);
	if (fd == -1) {
		saved_errno = errno;
		DEBUG(3, ("open(\"/dev/zero\") failed: %s\n",
			  strerror(saved_errno)));
		goto fail;
	}

	result->ptr = mmap(NULL, size, PROT_READ|PROT_WRITE,
			   MAP_SHARED|MAP_FILE, fd, 0);
	/* close() may overwrite errno, so keep mmap's value first */
	saved_errno = errno;
	close(fd);

	if (result->ptr == MAP_FAILED) {
		DEBUG(1, ("mmap failed: %s\n", strerror(saved_errno)));
		goto fail;
	}

	result->size = size;
	talloc_set_destructor(result, mmap_area_destructor);

	return result;

fail:
	TALLOC_FREE(result);
	/* logging and freeing may have touched errno; restore the cause */
	errno = saved_errno;
	return NULL;
}
2012-07-13 13:59:52 +02:00
/* Operation a helper child is asked to perform. */
enum cmd_type {
	READ_CMD,	/* read from the file into the mapped buffer */
	WRITE_CMD,	/* write the mapped buffer to the file */
	FSYNC_CMD	/* fsync() the file */
};
static const char * cmd_type_str ( enum cmd_type cmd )
{
const char * result ;
switch ( cmd ) {
case READ_CMD :
result = " READ " ;
break ;
case WRITE_CMD :
result = " WRITE " ;
break ;
2012-07-13 14:05:11 +02:00
case FSYNC_CMD :
result = " FSYNC " ;
break ;
2012-07-13 13:59:52 +02:00
default :
result = " <UNKNOWN> " ;
break ;
}
return result ;
}
2008-02-21 16:14:08 +01:00
struct rw_cmd {
size_t n ;
2012-04-05 14:53:08 +10:00
off_t offset ;
2012-07-13 13:59:52 +02:00
enum cmd_type cmd ;
2012-08-21 19:22:37 +10:00
bool erratic_testing_mode ;
2008-02-21 16:14:08 +01:00
} ;
/* Reply sent from a helper child back to the parent. */
struct rw_ret {
	ssize_t size;		/* result of the operation, -1 on failure */
	int ret_errno;		/* errno when size is -1, otherwise 0 */
	uint64_t duration;	/* nsec_time_diff() across the operation */
};
struct aio_child_list;

/* Parent-side bookkeeping for one forked helper process. */
struct aio_child {
	struct aio_child *prev, *next;	/* DLIST linkage */
	struct aio_child_list *list;	/* list this child is linked into */
	pid_t pid;			/* result of fork() */
	int sockfd;			/* our end of the socketpair */
	struct mmap_area *map;		/* data buffer used for read/write */
	bool dont_delete;		/* Marked as in use since last cleanup */
	bool busy;			/* handed out to a request */
};
/* The pool of helper children and the timer that reaps idle ones. */
struct aio_child_list {
	struct aio_child *children;		/* head of the DLIST */
	struct tevent_timer *cleanup_event;	/* NULL when not scheduled */
};
/*
 * Receive up to nbytes of payload from the socket fd into ptr, together with
 * at most one passed file descriptor.
 *
 * recvmsg() is restarted when it fails with EINTR. After a successful
 * receive, *recvfd is set to the passed descriptor if exactly one arrived;
 * otherwise every descriptor that did arrive is closed and *recvfd is set to
 * -1. When recvmsg() fails or returns 0, *recvfd is left untouched.
 *
 * Returns the recvmsg() result.
 */
static ssize_t read_fd(int fd, void *ptr, size_t nbytes, int *recvfd)
{
	struct iovec iov[1];
	struct msghdr msg = { .msg_iov = iov, .msg_iovlen = 1 };
	ssize_t n;
	size_t num_fds;
	size_t bufsize = msghdr_prep_recv_fds(NULL, NULL, 0, 1);
	uint8_t buf[bufsize];

	msghdr_prep_recv_fds(&msg, buf, bufsize, 1);

	iov[0].iov_base = ptr;
	iov[0].iov_len = nbytes;

	do {
		n = recvmsg(fd, &msg, 0);
	} while ((n == -1) && (errno == EINTR));

	if (n <= 0) {
		return n;
	}

	num_fds = msghdr_extract_fds(&msg, NULL, 0);
	if (num_fds == 0) {
		/*
		 * Nothing was passed. Return before declaring the array
		 * below: a variable length array of size zero is undefined.
		 */
		*recvfd = -1;
		return n;
	}

	{
		int fds[num_fds];

		msghdr_extract_fds(&msg, fds, num_fds);

		if (num_fds != 1) {
			size_t i;

			/* More than expected: do not leak the extras */
			for (i = 0; i < num_fds; i++) {
				close(fds[i]);
			}

			*recvfd = -1;
			return n;
		}

		*recvfd = fds[0];
	}

	return n;
}
static ssize_t write_fd ( int fd , void * ptr , size_t nbytes , int sendfd )
{
2015-03-03 15:48:46 +01:00
struct msghdr msg = { 0 } ;
2014-12-31 13:03:24 +01:00
size_t bufsize = msghdr_prep_fds ( NULL , NULL , 0 , & sendfd , 1 ) ;
uint8_t buf [ bufsize ] ;
struct iovec iov ;
2014-12-31 14:27:03 +01:00
ssize_t sent ;
2008-02-21 16:14:08 +01:00
2014-12-31 13:03:24 +01:00
msghdr_prep_fds ( & msg , buf , bufsize , & sendfd , 1 ) ;
2008-02-21 16:14:08 +01:00
2014-12-31 13:03:24 +01:00
iov . iov_base = ( void * ) ptr ;
iov . iov_len = nbytes ;
msg . msg_iov = & iov ;
2008-02-21 16:14:08 +01:00
msg . msg_iovlen = 1 ;
2014-12-31 14:27:03 +01:00
do {
sent = sendmsg ( fd , & msg , 0 ) ;
} while ( ( sent = = - 1 ) & & ( errno = = EINTR ) ) ;
return sent ;
2008-02-21 16:14:08 +01:00
}
2013-02-18 09:59:08 +01:00
static void aio_child_cleanup ( struct tevent_context * event_ctx ,
2013-02-18 10:18:29 +01:00
struct tevent_timer * te ,
2009-01-05 10:22:50 +01:00
struct timeval now ,
2008-02-21 16:14:08 +01:00
void * private_data )
{
struct aio_child_list * list = talloc_get_type_abort (
private_data , struct aio_child_list ) ;
struct aio_child * child , * next ;
TALLOC_FREE ( list - > cleanup_event ) ;
for ( child = list - > children ; child ! = NULL ; child = next ) {
next = child - > next ;
2012-07-09 11:10:30 +02:00
if ( child - > busy ) {
2008-02-21 16:14:08 +01:00
DEBUG ( 10 , ( " child %d currently active \n " ,
( int ) child - > pid ) ) ;
continue ;
}
if ( child - > dont_delete ) {
DEBUG ( 10 , ( " Child %d was active since last cleanup \n " ,
( int ) child - > pid ) ) ;
child - > dont_delete = false ;
continue ;
}
DEBUG ( 10 , ( " Child %d idle for more than 30 seconds, "
" deleting \n " , ( int ) child - > pid ) ) ;
TALLOC_FREE ( child ) ;
2011-01-13 15:59:18 +01:00
child = next ;
2008-02-21 16:14:08 +01:00
}
if ( list - > children ! = NULL ) {
/*
* Re - schedule the next cleanup round
*/
2018-08-21 11:06:16 -07:00
list - > cleanup_event = tevent_add_timer ( global_event_context ( ) , list ,
2009-01-05 10:22:50 +01:00
timeval_add ( & now , 30 , 0 ) ,
2008-02-21 16:14:08 +01:00
aio_child_cleanup , list ) ;
}
}
static struct aio_child_list * init_aio_children ( struct vfs_handle_struct * handle )
{
2017-12-07 20:53:18 +01:00
struct aio_fork_config * config ;
struct aio_child_list * children ;
2008-02-21 16:14:08 +01:00
2017-12-07 20:53:18 +01:00
SMB_VFS_HANDLE_GET_DATA ( handle , config , struct aio_fork_config ,
return NULL ) ;
2008-02-21 16:14:08 +01:00
2017-12-07 20:53:18 +01:00
if ( config - > children = = NULL ) {
config - > children = talloc_zero ( config , struct aio_child_list ) ;
if ( config - > children = = NULL ) {
2008-02-21 16:14:08 +01:00
return NULL ;
}
}
2017-12-07 20:53:18 +01:00
children = config - > children ;
2008-02-21 16:14:08 +01:00
/*
* Regardless of whether the child_list had been around or not , make
* sure that we have a cleanup timed event . This timed event will
* delete itself when it finds that no children are around anymore .
*/
2017-12-07 20:53:18 +01:00
if ( children - > cleanup_event = = NULL ) {
children - > cleanup_event =
2018-08-21 11:06:16 -07:00
tevent_add_timer ( global_event_context ( ) , children ,
2017-12-07 20:53:18 +01:00
timeval_current_ofs ( 30 , 0 ) ,
aio_child_cleanup , children ) ;
if ( children - > cleanup_event = = NULL ) {
TALLOC_FREE ( config - > children ) ;
2008-02-21 16:14:08 +01:00
return NULL ;
}
}
2017-12-07 20:53:18 +01:00
return children ;
2008-02-21 16:14:08 +01:00
}
static void aio_child_loop ( int sockfd , struct mmap_area * map )
{
while ( true ) {
int fd = - 1 ;
ssize_t ret ;
struct rw_cmd cmd_struct ;
struct rw_ret ret_struct ;
2016-02-26 09:59:23 +01:00
struct timespec start , end ;
2008-02-21 16:14:08 +01:00
ret = read_fd ( sockfd , & cmd_struct , sizeof ( cmd_struct ) , & fd ) ;
if ( ret ! = sizeof ( cmd_struct ) ) {
DEBUG ( 10 , ( " read_fd returned %d: %s \n " , ( int ) ret ,
strerror ( errno ) ) ) ;
exit ( 1 ) ;
}
DEBUG ( 10 , ( " aio_child_loop: %s %d bytes at %d from fd %d \n " ,
2012-07-13 13:59:52 +02:00
cmd_type_str ( cmd_struct . cmd ) ,
2008-02-21 16:14:08 +01:00
( int ) cmd_struct . n , ( int ) cmd_struct . offset , fd ) ) ;
2012-08-21 19:22:37 +10:00
if ( cmd_struct . erratic_testing_mode ) {
2008-02-21 16:14:08 +01:00
/*
2012-08-21 08:16:24 +10:00
* For developer testing , we want erratic behaviour for
2008-02-21 16:14:08 +01:00
* async I / O times
*/
uint8_t randval ;
unsigned msecs ;
/*
* use generate_random_buffer , we just forked from a
* common parent state
*/
generate_random_buffer ( & randval , sizeof ( randval ) ) ;
2017-12-11 17:32:40 +01:00
msecs = ( randval % 20 ) + 1 ;
2008-02-21 16:14:08 +01:00
DEBUG ( 10 , ( " delaying for %u msecs \n " , msecs ) ) ;
smb_msleep ( msecs ) ;
}
ZERO_STRUCT ( ret_struct ) ;
2016-03-28 10:19:49 +03:00
PROFILE_TIMESTAMP ( & start ) ;
2016-02-26 09:59:23 +01:00
2012-07-13 13:59:52 +02:00
switch ( cmd_struct . cmd ) {
case READ_CMD :
2020-05-07 12:42:10 -07:00
ret_struct . size = sys_pread_full (
2015-04-10 11:10:27 +02:00
fd , discard_const ( map - > ptr ) , cmd_struct . n ,
2008-02-21 16:14:08 +01:00
cmd_struct . offset ) ;
2010-06-04 21:00:24 -07:00
#if 0
/* This breaks "make test" when run with aio_fork module. */
2012-08-21 08:16:24 +10:00
# ifdef DEVELOPER
2009-09-14 03:21:30 +02:00
ret_struct . size = MAX ( 1 , ret_struct . size * 0.9 ) ;
2010-06-04 21:00:24 -07:00
# endif
2009-09-14 03:21:30 +02:00
# endif
2012-07-13 13:59:52 +02:00
break ;
case WRITE_CMD :
2020-05-07 12:42:53 -07:00
ret_struct . size = sys_pwrite_full (
2015-04-10 11:10:27 +02:00
fd , discard_const ( map - > ptr ) , cmd_struct . n ,
2008-02-21 16:14:08 +01:00
cmd_struct . offset ) ;
2012-07-13 13:59:52 +02:00
break ;
2012-07-13 14:05:11 +02:00
case FSYNC_CMD :
ret_struct . size = fsync ( fd ) ;
break ;
2012-07-13 13:59:52 +02:00
default :
ret_struct . size = - 1 ;
errno = EINVAL ;
2008-02-21 16:14:08 +01:00
}
2016-03-28 10:19:49 +03:00
PROFILE_TIMESTAMP ( & end ) ;
2016-02-26 09:59:23 +01:00
ret_struct . duration = nsec_time_diff ( & end , & start ) ;
2008-02-21 16:14:08 +01:00
DEBUG ( 10 , ( " aio_child_loop: syscall returned %d \n " ,
( int ) ret_struct . size ) ) ;
if ( ret_struct . size = = - 1 ) {
ret_struct . ret_errno = errno ;
}
2009-05-18 09:36:16 +02:00
/*
* Close the fd before telling our parent we ' re done . The
* parent might close and re - open the file very quickly , and
* with system - level share modes ( GPFS ) we would get an
* unjustified SHARING_VIOLATION .
*/
close ( fd ) ;
2008-02-21 16:14:08 +01:00
ret = write_data ( sockfd , ( char * ) & ret_struct ,
sizeof ( ret_struct ) ) ;
if ( ret ! = sizeof ( ret_struct ) ) {
DEBUG ( 10 , ( " could not write ret_struct: %s \n " ,
strerror ( errno ) ) ) ;
exit ( 2 ) ;
}
}
}
static int aio_child_destructor ( struct aio_child * child )
{
2011-01-13 16:04:36 +01:00
char c = 0 ;
2012-07-09 11:10:30 +02:00
SMB_ASSERT ( ! child - > busy ) ;
2011-01-13 16:04:36 +01:00
DEBUG ( 10 , ( " aio_child_destructor: removing child %d on fd %d \n " ,
2015-05-06 16:25:51 +02:00
( int ) child - > pid , child - > sockfd ) ) ;
2011-01-13 16:04:36 +01:00
/*
* closing the sockfd makes the child not return from recvmsg ( ) on RHEL
* 5.5 so instead force the child to exit by writing bad data to it
*/
2016-04-05 22:21:19 +02:00
sys_write_v ( child - > sockfd , & c , sizeof ( c ) ) ;
2008-02-21 16:14:08 +01:00
close ( child - > sockfd ) ;
DLIST_REMOVE ( child - > list - > children , child ) ;
return 0 ;
}
2009-05-18 09:49:23 +02:00
/*
* We have to close all fd ' s in open files , we might incorrectly hold a system
* level share mode on a file .
*/
static struct files_struct * close_fsp_fd ( struct files_struct * fsp ,
void * private_data )
{
2020-10-03 21:24:29 +02:00
if ( ( fsp - > fh ! = NULL ) & & ( fsp_get_pathref_fd ( fsp ) ! = - 1 ) ) {
close ( fsp_get_pathref_fd ( fsp ) ) ;
2020-09-26 21:46:51 +02:00
fsp_set_fd ( fsp , - 1 ) ;
2009-05-18 09:49:23 +02:00
}
return NULL ;
}
2012-07-09 09:00:55 +02:00
static int create_aio_child ( struct smbd_server_connection * sconn ,
struct aio_child_list * children ,
size_t map_size ,
struct aio_child * * presult )
2008-02-21 16:14:08 +01:00
{
struct aio_child * result ;
int fdpair [ 2 ] ;
2012-07-09 09:00:55 +02:00
int ret ;
2008-02-21 16:14:08 +01:00
fdpair [ 0 ] = fdpair [ 1 ] = - 1 ;
2011-06-07 11:44:43 +10:00
result = talloc_zero ( children , struct aio_child ) ;
2012-07-09 09:00:55 +02:00
if ( result = = NULL ) {
return ENOMEM ;
}
2008-02-21 16:14:08 +01:00
if ( socketpair ( AF_UNIX , SOCK_STREAM , 0 , fdpair ) = = - 1 ) {
2012-07-09 09:00:55 +02:00
ret = errno ;
2008-02-21 16:14:08 +01:00
DEBUG ( 10 , ( " socketpair() failed: %s \n " , strerror ( errno ) ) ) ;
goto fail ;
}
DEBUG ( 10 , ( " fdpair = %d/%d \n " , fdpair [ 0 ] , fdpair [ 1 ] ) ) ;
result - > map = mmap_area_init ( result , map_size ) ;
if ( result - > map = = NULL ) {
2012-07-09 09:00:55 +02:00
ret = errno ;
2008-02-21 16:14:08 +01:00
DEBUG ( 0 , ( " Could not create mmap area \n " ) ) ;
goto fail ;
}
2012-03-24 20:17:08 +01:00
result - > pid = fork ( ) ;
2008-02-21 16:14:08 +01:00
if ( result - > pid = = - 1 ) {
2012-07-09 09:00:55 +02:00
ret = errno ;
2008-02-21 16:14:08 +01:00
DEBUG ( 0 , ( " fork failed: %s \n " , strerror ( errno ) ) ) ;
goto fail ;
}
if ( result - > pid = = 0 ) {
close ( fdpair [ 0 ] ) ;
result - > sockfd = fdpair [ 1 ] ;
2010-09-27 03:53:00 +02:00
files_forall ( sconn , close_fsp_fd , NULL ) ;
2008-02-21 16:14:08 +01:00
aio_child_loop ( result - > sockfd , result - > map ) ;
}
2011-01-13 16:04:36 +01:00
DEBUG ( 10 , ( " Child %d created with sockfd %d \n " ,
2015-05-06 16:25:51 +02:00
( int ) result - > pid , fdpair [ 0 ] ) ) ;
2008-02-21 16:14:08 +01:00
result - > sockfd = fdpair [ 0 ] ;
close ( fdpair [ 1 ] ) ;
result - > list = children ;
DLIST_ADD ( children - > children , result ) ;
talloc_set_destructor ( result , aio_child_destructor ) ;
* presult = result ;
2012-07-09 09:00:55 +02:00
return 0 ;
2008-02-21 16:14:08 +01:00
fail :
if ( fdpair [ 0 ] ! = - 1 ) close ( fdpair [ 0 ] ) ;
if ( fdpair [ 1 ] ! = - 1 ) close ( fdpair [ 1 ] ) ;
TALLOC_FREE ( result ) ;
2012-07-09 09:00:55 +02:00
return ret ;
2008-02-21 16:14:08 +01:00
}
2012-07-09 09:00:55 +02:00
static int get_idle_child ( struct vfs_handle_struct * handle ,
struct aio_child * * pchild )
2008-02-21 16:14:08 +01:00
{
struct aio_child_list * children ;
struct aio_child * child ;
children = init_aio_children ( handle ) ;
if ( children = = NULL ) {
2012-07-09 09:00:55 +02:00
return ENOMEM ;
2008-02-21 16:14:08 +01:00
}
for ( child = children - > children ; child ! = NULL ; child = child - > next ) {
2012-07-09 11:10:30 +02:00
if ( ! child - > busy ) {
2008-02-21 16:14:08 +01:00
break ;
}
}
if ( child = = NULL ) {
2012-07-09 09:00:55 +02:00
int ret ;
2008-02-21 16:14:08 +01:00
DEBUG ( 10 , ( " no idle child found, creating new one \n " ) ) ;
2012-07-09 09:00:55 +02:00
ret = create_aio_child ( handle - > conn - > sconn , children ,
2010-09-27 03:53:00 +02:00
128 * 1024 , & child ) ;
2012-07-09 09:00:55 +02:00
if ( ret ! = 0 ) {
2008-02-21 16:14:08 +01:00
DEBUG ( 10 , ( " create_aio_child failed: %s \n " ,
2012-07-09 09:00:55 +02:00
strerror ( errno ) ) ) ;
2012-07-09 09:00:55 +02:00
return ret ;
2008-02-21 16:14:08 +01:00
}
}
child - > dont_delete = true ;
2012-07-09 11:10:30 +02:00
child - > busy = true ;
2008-02-21 16:14:08 +01:00
* pchild = child ;
2012-07-09 09:00:55 +02:00
return 0 ;
2008-02-21 16:14:08 +01:00
}
2012-07-09 11:10:30 +02:00
struct aio_fork_pread_state {
2008-02-21 16:14:08 +01:00
struct aio_child * child ;
2017-12-08 14:07:06 +01:00
size_t n ;
void * data ;
2008-02-21 16:14:08 +01:00
ssize_t ret ;
2016-02-26 10:54:01 +01:00
struct vfs_aio_state vfs_aio_state ;
2012-07-09 11:10:30 +02:00
} ;
2008-02-21 16:14:08 +01:00
2012-07-09 11:10:30 +02:00
static void aio_fork_pread_done ( struct tevent_req * subreq ) ;
2008-02-21 16:14:08 +01:00
2012-07-09 11:10:30 +02:00
/*
 * Start an asynchronous pread of n bytes at offset from fsp into data.
 *
 * The request is handed to a helper child together with the file's
 * descriptor; aio_fork_pread_done() picks up the reply. Reads of more than
 * 128k fail with EINVAL.
 *
 * Returns the new request, or NULL when the module configuration is missing
 * or the request could not be allocated.
 */
static struct tevent_req *aio_fork_pread_send(struct vfs_handle_struct *handle,
					      TALLOC_CTX *mem_ctx,
					      struct tevent_context *ev,
					      struct files_struct *fsp,
					      void *data,
					      size_t n, off_t offset)
{
	struct tevent_req *req, *subreq;
	struct aio_fork_pread_state *state;
	struct rw_cmd cmd;
	ssize_t written;
	int err;
	struct aio_fork_config *config;

	SMB_VFS_HANDLE_GET_DATA(handle, config,
				struct aio_fork_config,
				return NULL);

	req = tevent_req_create(mem_ctx, &state, struct aio_fork_pread_state);
	if (req == NULL) {
		return NULL;
	}
	state->n = n;
	state->data = data;

	if (n > 128*1024) {
		/* TODO: support variable buffers */
		tevent_req_error(req, EINVAL);
		return tevent_req_post(req, ev);
	}

	err = get_idle_child(handle, &state->child);
	if (err != 0) {
		tevent_req_error(req, err);
		return tevent_req_post(req, ev);
	}

	ZERO_STRUCT(cmd);
	cmd.n = n;
	cmd.offset = offset;
	cmd.cmd = READ_CMD;
	cmd.erratic_testing_mode = config->erratic_testing_mode;

	DEBUG(10, ("sending fd %d to child %d\n", fsp_get_io_fd(fsp),
		   (int)state->child->pid));

	/*
	 * Not making this async. We're writing into an empty unix
	 * domain socket. This should never block.
	 */
	written = write_fd(state->child->sockfd, &cmd, sizeof(cmd),
			   fsp_get_io_fd(fsp));
	if (written == -1) {
		err = errno;

		/* aio_child_destructor() asserts that the child is idle */
		state->child->busy = false;
		TALLOC_FREE(state->child);

		DEBUG(10, ("write_fd failed: %s\n", strerror(err)));
		tevent_req_error(req, err);
		return tevent_req_post(req, ev);
	}

	subreq = read_packet_send(state, ev, state->child->sockfd,
				  sizeof(struct rw_ret), NULL, NULL);
	if (tevent_req_nomem(subreq, req)) {
		/* aio_child_destructor() asserts that the child is idle */
		state->child->busy = false;
		TALLOC_FREE(state->child); /* we sent sth down */
		return tevent_req_post(req, ev);
	}
	tevent_req_set_callback(subreq, aio_fork_pread_done, req);
	return req;
}
2012-07-09 11:10:30 +02:00
static void aio_fork_pread_done ( struct tevent_req * subreq )
2008-02-21 16:14:08 +01:00
{
2012-07-09 11:10:30 +02:00
struct tevent_req * req = tevent_req_callback_data (
subreq , struct tevent_req ) ;
struct aio_fork_pread_state * state = tevent_req_data (
req , struct aio_fork_pread_state ) ;
ssize_t nread ;
uint8_t * buf ;
int err ;
struct rw_ret * retbuf ;
2008-02-21 16:14:08 +01:00
2012-07-09 11:10:30 +02:00
nread = read_packet_recv ( subreq , talloc_tos ( ) , & buf , & err ) ;
TALLOC_FREE ( subreq ) ;
if ( nread = = - 1 ) {
TALLOC_FREE ( state - > child ) ;
tevent_req_error ( req , err ) ;
return ;
2008-02-21 16:14:08 +01:00
}
2012-07-09 11:10:30 +02:00
retbuf = ( struct rw_ret * ) buf ;
state - > ret = retbuf - > size ;
2016-02-26 10:54:01 +01:00
state - > vfs_aio_state . error = retbuf - > ret_errno ;
2016-02-26 09:59:23 +01:00
state - > vfs_aio_state . duration = retbuf - > duration ;
2017-12-08 14:07:06 +01:00
if ( ( size_t ) state - > ret > state - > n ) {
tevent_req_error ( req , EIO ) ;
state - > child - > busy = false ;
return ;
}
memcpy ( state - > data , state - > child - > map - > ptr , state - > ret ) ;
state - > child - > busy = false ;
2012-07-09 11:10:30 +02:00
tevent_req_done ( req ) ;
2008-02-21 16:14:08 +01:00
}
2016-02-26 10:54:01 +01:00
static ssize_t aio_fork_pread_recv ( struct tevent_req * req ,
struct vfs_aio_state * vfs_aio_state )
2008-02-21 16:14:08 +01:00
{
2012-07-09 11:10:30 +02:00
struct aio_fork_pread_state * state = tevent_req_data (
req , struct aio_fork_pread_state ) ;
2008-02-21 16:14:08 +01:00
2016-02-26 10:54:01 +01:00
if ( tevent_req_is_unix_error ( req , & vfs_aio_state - > error ) ) {
2008-02-21 16:14:08 +01:00
return - 1 ;
}
2016-02-26 10:54:01 +01:00
* vfs_aio_state = state - > vfs_aio_state ;
2012-07-09 11:10:30 +02:00
return state - > ret ;
}
2012-04-12 15:04:08 -07:00
2012-07-09 11:10:30 +02:00
struct aio_fork_pwrite_state {
struct aio_child * child ;
ssize_t ret ;
2016-02-26 10:54:01 +01:00
struct vfs_aio_state vfs_aio_state ;
2012-07-09 11:10:30 +02:00
} ;
2008-02-21 16:14:08 +01:00
2012-07-09 11:10:30 +02:00
static void aio_fork_pwrite_done ( struct tevent_req * subreq ) ;
2008-02-21 16:14:08 +01:00
2012-07-09 11:10:30 +02:00
/*
 * Start an asynchronous pwrite of n bytes from data to fsp at offset.
 *
 * The data is copied into the buffer of a helper child, which then receives
 * the command together with the file's descriptor; aio_fork_pwrite_done()
 * picks up the reply. Writes of more than 128k fail with EINVAL.
 *
 * Returns the new request, or NULL when the module configuration is missing
 * or the request could not be allocated.
 */
static struct tevent_req *aio_fork_pwrite_send(
	struct vfs_handle_struct *handle, TALLOC_CTX *mem_ctx,
	struct tevent_context *ev, struct files_struct *fsp,
	const void *data, size_t n, off_t offset)
{
	struct tevent_req *req, *subreq;
	struct aio_fork_pwrite_state *state;
	struct rw_cmd cmd;
	ssize_t written;
	int err;
	struct aio_fork_config *config;

	SMB_VFS_HANDLE_GET_DATA(handle, config,
				struct aio_fork_config,
				return NULL);

	req = tevent_req_create(mem_ctx, &state, struct aio_fork_pwrite_state);
	if (req == NULL) {
		return NULL;
	}

	if (n > 128*1024) {
		/* TODO: support variable buffers */
		tevent_req_error(req, EINVAL);
		return tevent_req_post(req, ev);
	}

	err = get_idle_child(handle, &state->child);
	if (err != 0) {
		tevent_req_error(req, err);
		return tevent_req_post(req, ev);
	}

	memcpy(state->child->map->ptr, data, n);

	ZERO_STRUCT(cmd);
	cmd.n = n;
	cmd.offset = offset;
	cmd.cmd = WRITE_CMD;
	cmd.erratic_testing_mode = config->erratic_testing_mode;

	DEBUG(10, ("sending fd %d to child %d\n", fsp_get_io_fd(fsp),
		   (int)state->child->pid));

	/*
	 * Not making this async. We're writing into an empty unix
	 * domain socket. This should never block.
	 */
	written = write_fd(state->child->sockfd, &cmd, sizeof(cmd),
			   fsp_get_io_fd(fsp));
	if (written == -1) {
		err = errno;

		/* aio_child_destructor() asserts that the child is idle */
		state->child->busy = false;
		TALLOC_FREE(state->child);

		DEBUG(10, ("write_fd failed: %s\n", strerror(err)));
		tevent_req_error(req, err);
		return tevent_req_post(req, ev);
	}

	subreq = read_packet_send(state, ev, state->child->sockfd,
				  sizeof(struct rw_ret), NULL, NULL);
	if (tevent_req_nomem(subreq, req)) {
		/* aio_child_destructor() asserts that the child is idle */
		state->child->busy = false;
		TALLOC_FREE(state->child); /* we sent sth down */
		return tevent_req_post(req, ev);
	}
	tevent_req_set_callback(subreq, aio_fork_pwrite_done, req);
	return req;
}
2012-07-09 11:10:30 +02:00
static void aio_fork_pwrite_done ( struct tevent_req * subreq )
2010-06-04 21:00:24 -07:00
{
2012-07-09 11:10:30 +02:00
struct tevent_req * req = tevent_req_callback_data (
subreq , struct tevent_req ) ;
struct aio_fork_pwrite_state * state = tevent_req_data (
req , struct aio_fork_pwrite_state ) ;
ssize_t nread ;
uint8_t * buf ;
2012-06-11 11:00:27 +02:00
int err ;
2012-07-09 11:10:30 +02:00
struct rw_ret * retbuf ;
2010-06-04 21:00:24 -07:00
2012-07-09 11:10:30 +02:00
nread = read_packet_recv ( subreq , talloc_tos ( ) , & buf , & err ) ;
TALLOC_FREE ( subreq ) ;
if ( nread = = - 1 ) {
TALLOC_FREE ( state - > child ) ;
tevent_req_error ( req , err ) ;
return ;
2010-06-04 21:00:24 -07:00
}
2012-07-09 11:10:30 +02:00
state - > child - > busy = false ;
2010-06-04 21:00:24 -07:00
2012-07-09 11:10:30 +02:00
retbuf = ( struct rw_ret * ) buf ;
state - > ret = retbuf - > size ;
2016-02-26 10:54:01 +01:00
state - > vfs_aio_state . error = retbuf - > ret_errno ;
2016-02-26 09:59:23 +01:00
state - > vfs_aio_state . duration = retbuf - > duration ;
2012-07-09 11:10:30 +02:00
tevent_req_done ( req ) ;
}
2010-06-04 21:00:24 -07:00
2016-02-26 10:54:01 +01:00
static ssize_t aio_fork_pwrite_recv ( struct tevent_req * req ,
struct vfs_aio_state * vfs_aio_state )
2012-07-09 11:10:30 +02:00
{
struct aio_fork_pwrite_state * state = tevent_req_data (
req , struct aio_fork_pwrite_state ) ;
2010-06-04 21:00:24 -07:00
2016-02-26 10:54:01 +01:00
if ( tevent_req_is_unix_error ( req , & vfs_aio_state - > error ) ) {
2012-07-09 11:10:30 +02:00
return - 1 ;
2010-06-04 21:00:24 -07:00
}
2016-02-26 10:54:01 +01:00
* vfs_aio_state = state - > vfs_aio_state ;
2012-07-09 11:10:30 +02:00
return state - > ret ;
2010-06-04 21:00:24 -07:00
}
2012-07-13 14:05:11 +02:00
struct aio_fork_fsync_state {
struct aio_child * child ;
ssize_t ret ;
2016-02-26 10:54:01 +01:00
struct vfs_aio_state vfs_aio_state ;
2012-07-13 14:05:11 +02:00
} ;
static void aio_fork_fsync_done ( struct tevent_req * subreq ) ;
/*
 * Start an asynchronous fsync of fsp.
 *
 * The command is handed to a helper child together with the file's
 * descriptor; aio_fork_fsync_done() picks up the reply.
 *
 * Returns the new request, or NULL when the module configuration is missing
 * or the request could not be allocated.
 */
static struct tevent_req *aio_fork_fsync_send(
	struct vfs_handle_struct *handle, TALLOC_CTX *mem_ctx,
	struct tevent_context *ev, struct files_struct *fsp)
{
	struct tevent_req *req, *subreq;
	struct aio_fork_fsync_state *state;
	struct rw_cmd cmd;
	ssize_t written;
	int err;
	struct aio_fork_config *config;

	SMB_VFS_HANDLE_GET_DATA(handle, config,
				struct aio_fork_config,
				return NULL);

	req = tevent_req_create(mem_ctx, &state, struct aio_fork_fsync_state);
	if (req == NULL) {
		return NULL;
	}

	err = get_idle_child(handle, &state->child);
	if (err != 0) {
		tevent_req_error(req, err);
		return tevent_req_post(req, ev);
	}

	ZERO_STRUCT(cmd);
	cmd.cmd = FSYNC_CMD;
	cmd.erratic_testing_mode = config->erratic_testing_mode;

	DEBUG(10, ("sending fd %d to child %d\n", fsp_get_io_fd(fsp),
		   (int)state->child->pid));

	/*
	 * Not making this async. We're writing into an empty unix
	 * domain socket. This should never block.
	 */
	written = write_fd(state->child->sockfd, &cmd, sizeof(cmd),
			   fsp_get_io_fd(fsp));
	if (written == -1) {
		err = errno;

		/* aio_child_destructor() asserts that the child is idle */
		state->child->busy = false;
		TALLOC_FREE(state->child);

		DEBUG(10, ("write_fd failed: %s\n", strerror(err)));
		tevent_req_error(req, err);
		return tevent_req_post(req, ev);
	}

	subreq = read_packet_send(state, ev, state->child->sockfd,
				  sizeof(struct rw_ret), NULL, NULL);
	if (tevent_req_nomem(subreq, req)) {
		/* aio_child_destructor() asserts that the child is idle */
		state->child->busy = false;
		TALLOC_FREE(state->child); /* we sent sth down */
		return tevent_req_post(req, ev);
	}
	tevent_req_set_callback(subreq, aio_fork_fsync_done, req);
	return req;
}
static void aio_fork_fsync_done ( struct tevent_req * subreq )
{
struct tevent_req * req = tevent_req_callback_data (
subreq , struct tevent_req ) ;
struct aio_fork_fsync_state * state = tevent_req_data (
req , struct aio_fork_fsync_state ) ;
ssize_t nread ;
uint8_t * buf ;
int err ;
struct rw_ret * retbuf ;
nread = read_packet_recv ( subreq , talloc_tos ( ) , & buf , & err ) ;
TALLOC_FREE ( subreq ) ;
if ( nread = = - 1 ) {
TALLOC_FREE ( state - > child ) ;
tevent_req_error ( req , err ) ;
return ;
}
state - > child - > busy = false ;
retbuf = ( struct rw_ret * ) buf ;
state - > ret = retbuf - > size ;
2016-02-26 10:54:01 +01:00
state - > vfs_aio_state . error = retbuf - > ret_errno ;
2016-02-26 09:59:23 +01:00
state - > vfs_aio_state . duration = retbuf - > duration ;
2012-07-13 14:05:11 +02:00
tevent_req_done ( req ) ;
}
2016-02-26 10:54:01 +01:00
static int aio_fork_fsync_recv ( struct tevent_req * req ,
struct vfs_aio_state * vfs_aio_state )
2012-07-13 14:05:11 +02:00
{
struct aio_fork_fsync_state * state = tevent_req_data (
req , struct aio_fork_fsync_state ) ;
2016-02-26 10:54:01 +01:00
if ( tevent_req_is_unix_error ( req , & vfs_aio_state - > error ) ) {
2012-07-13 14:05:11 +02:00
return - 1 ;
}
2016-02-26 10:54:01 +01:00
* vfs_aio_state = state - > vfs_aio_state ;
2012-07-13 14:05:11 +02:00
return state - > ret ;
}
2012-04-08 21:49:59 +02:00
/*
 * Connect hook: after the next module has connected, allocate the module
 * configuration, read the "vfs_aio_fork:erratic_testing_mode" parameter and
 * attach the configuration to the handle.
 *
 * Returns the next module's result if that is negative, -1 when the
 * configuration cannot be allocated or attached, and 0 on success.
 */
static int aio_fork_connect(vfs_handle_struct *handle, const char *service,
			    const char *user)
{
	struct aio_fork_config *cfg;
	int rc;

	rc = SMB_VFS_NEXT_CONNECT(handle, service, user);
	if (rc < 0) {
		return rc;
	}

	cfg = talloc_zero(handle->conn, struct aio_fork_config);
	if (cfg == NULL) {
		SMB_VFS_NEXT_DISCONNECT(handle);
		DEBUG(0, ("talloc_zero() failed\n"));
		return -1;
	}

	cfg->erratic_testing_mode = lp_parm_bool(SNUM(handle->conn),
						 "vfs_aio_fork",
						 "erratic_testing_mode",
						 false);

	SMB_VFS_HANDLE_SET_DATA(handle, cfg,
				NULL, struct aio_fork_config,
				return -1);

	return 0;
}
2009-07-23 20:28:58 -04:00
static struct vfs_fn_pointers vfs_aio_fork_fns = {
2012-04-08 21:49:59 +02:00
. connect_fn = aio_fork_connect ,
2012-07-09 11:10:30 +02:00
. pread_send_fn = aio_fork_pread_send ,
. pread_recv_fn = aio_fork_pread_recv ,
. pwrite_send_fn = aio_fork_pwrite_send ,
. pwrite_recv_fn = aio_fork_pwrite_recv ,
2012-07-13 14:05:11 +02:00
. fsync_send_fn = aio_fork_fsync_send ,
. fsync_recv_fn = aio_fork_fsync_recv ,
2008-02-21 16:14:08 +01:00
} ;
2017-12-15 15:32:12 -07:00
static_decl_vfs ;
2017-04-20 12:24:43 -07:00
NTSTATUS vfs_aio_fork_init ( TALLOC_CTX * ctx )
2008-02-21 16:14:08 +01:00
{
return smb_register_vfs ( SMB_VFS_INTERFACE_VERSION ,
2009-07-23 20:28:58 -04:00
" aio_fork " , & vfs_aio_fork_fns ) ;
2008-02-21 16:14:08 +01:00
}