2005-08-11 16:25:23 -04:00
/*
* linux / net / sunrpc / xprtsock . c
*
* Client - side transport implementation for sockets .
*
* TCP callback races fixes ( C ) 1998 Red Hat Software < alan @ redhat . com >
* TCP send fixes ( C ) 1998 Red Hat Software < alan @ redhat . com >
* TCP NFS related read + write fixes
* ( C ) 1999 Dave Airlie , University of Limerick , Ireland < airlied @ linux . ie >
*
* Rewrite of larges part of the code in order to stabilize TCP stuff .
* Fix behaviour when socket buffer is full .
* ( C ) 1999 Trond Myklebust < trond . myklebust @ fys . uio . no >
2005-08-11 16:25:47 -04:00
*
* IP socket transport implementation , ( C ) 2005 Chuck Lever < cel @ netapp . com >
2005-08-11 16:25:23 -04:00
*/
# include <linux/types.h>
# include <linux/slab.h>
# include <linux/capability.h>
# include <linux/pagemap.h>
# include <linux/errno.h>
# include <linux/socket.h>
# include <linux/in.h>
# include <linux/net.h>
# include <linux/mm.h>
# include <linux/udp.h>
# include <linux/tcp.h>
# include <linux/sunrpc/clnt.h>
2006-01-03 09:55:49 +01:00
# include <linux/sunrpc/sched.h>
2005-08-11 16:25:23 -04:00
# include <linux/file.h>
# include <net/sock.h>
# include <net/checksum.h>
# include <net/udp.h>
# include <net/tcp.h>
2005-11-01 12:24:48 -05:00
/*
* xprtsock tunables
*/
unsigned int xprt_udp_slot_table_entries = RPC_DEF_SLOT_TABLE ;
unsigned int xprt_tcp_slot_table_entries = RPC_DEF_SLOT_TABLE ;
unsigned int xprt_min_resvport = RPC_DEF_MIN_RESVPORT ;
unsigned int xprt_max_resvport = RPC_DEF_MAX_RESVPORT ;
2006-12-05 16:35:54 -05:00
/*
* We can register our own files under / proc / sys / sunrpc by
* calling register_sysctl_table ( ) again . The files in that
* directory become the union of all files registered there .
*
* We simply need to make sure that we don ' t collide with
* someone else ' s file names !
*/
# ifdef RPC_DEBUG
static unsigned int min_slot_table_size = RPC_MIN_SLOT_TABLE ;
static unsigned int max_slot_table_size = RPC_MAX_SLOT_TABLE ;
static unsigned int xprt_min_resvport_limit = RPC_MIN_RESVPORT ;
static unsigned int xprt_max_resvport_limit = RPC_MAX_RESVPORT ;
static struct ctl_table_header * sunrpc_table_header ;
/*
* FIXME : changing the UDP slot table size should also resize the UDP
* socket buffers for existing UDP transports
*/
static ctl_table xs_tunables_table [ ] = {
{
. ctl_name = CTL_SLOTTABLE_UDP ,
. procname = " udp_slot_table_entries " ,
. data = & xprt_udp_slot_table_entries ,
. maxlen = sizeof ( unsigned int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec_minmax ,
. strategy = & sysctl_intvec ,
. extra1 = & min_slot_table_size ,
. extra2 = & max_slot_table_size
} ,
{
. ctl_name = CTL_SLOTTABLE_TCP ,
. procname = " tcp_slot_table_entries " ,
. data = & xprt_tcp_slot_table_entries ,
. maxlen = sizeof ( unsigned int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec_minmax ,
. strategy = & sysctl_intvec ,
. extra1 = & min_slot_table_size ,
. extra2 = & max_slot_table_size
} ,
{
. ctl_name = CTL_MIN_RESVPORT ,
. procname = " min_resvport " ,
. data = & xprt_min_resvport ,
. maxlen = sizeof ( unsigned int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec_minmax ,
. strategy = & sysctl_intvec ,
. extra1 = & xprt_min_resvport_limit ,
. extra2 = & xprt_max_resvport_limit
} ,
{
. ctl_name = CTL_MAX_RESVPORT ,
. procname = " max_resvport " ,
. data = & xprt_max_resvport ,
. maxlen = sizeof ( unsigned int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec_minmax ,
. strategy = & sysctl_intvec ,
. extra1 = & xprt_min_resvport_limit ,
. extra2 = & xprt_max_resvport_limit
} ,
{
. ctl_name = 0 ,
} ,
} ;
static ctl_table sunrpc_table [ ] = {
{
. ctl_name = CTL_SUNRPC ,
. procname = " sunrpc " ,
. mode = 0555 ,
. child = xs_tunables_table
} ,
{
. ctl_name = 0 ,
} ,
} ;
# endif
2005-08-11 16:25:56 -04:00
/*
* How many times to try sending a request on a socket before waiting
* for the socket buffer to clear .
*/
# define XS_SENDMSG_RETRY (10U)
2005-08-25 16:25:55 -07:00
/*
* Time out for an RPC UDP socket connect . UDP socket connects are
* synchronous , but we set a timeout anyway in case of resource
* exhaustion on the local host .
*/
# define XS_UDP_CONN_TO (5U * HZ)
/*
* Wait duration for an RPC TCP connection to be established . Solaris
* NFS over TCP uses 60 seconds , for example , which is in line with how
* long a server takes to reboot .
*/
# define XS_TCP_CONN_TO (60U * HZ)
/*
* Wait duration for a reply from the RPC portmapper .
*/
# define XS_BIND_TO (60U * HZ)
/*
* Delay if a UDP socket connect error occurs . This is most likely some
* kind of resource problem on the local host .
*/
# define XS_UDP_REEST_TO (2U * HZ)
/*
* The reestablish timeout allows clients to delay for a bit before attempting
* to reconnect to a server that just dropped our connection .
*
* We implement an exponential backoff when trying to reestablish a TCP
* transport connection with the server . Some servers like to drop a TCP
* connection when they are overworked , so we start with a short timeout and
* increase over time if the server is down or not responding .
*/
# define XS_TCP_INIT_REEST_TO (3U * HZ)
# define XS_TCP_MAX_REEST_TO (5U * 60 * HZ)
/*
* TCP idle timeout ; client drops the transport socket if it is idle
* for this long . Note that we also timeout UDP sockets to prevent
* holding port numbers when there is no RPC traffic .
*/
# define XS_IDLE_DISC_TO (5U * 60 * HZ)
2005-08-11 16:25:23 -04:00
# ifdef RPC_DEBUG
# undef RPC_DEBUG_DATA
2005-08-11 16:25:26 -04:00
# define RPCDBG_FACILITY RPCDBG_TRANS
2005-08-11 16:25:23 -04:00
# endif
# ifdef RPC_DEBUG_DATA
2005-08-11 16:25:26 -04:00
static void xs_pktdump ( char * msg , u32 * packet , unsigned int count )
2005-08-11 16:25:23 -04:00
{
2005-08-11 16:25:26 -04:00
u8 * buf = ( u8 * ) packet ;
int j ;
2005-08-11 16:25:23 -04:00
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: %s \n " , msg ) ;
2005-08-11 16:25:23 -04:00
for ( j = 0 ; j < count & & j < 128 ; j + = 4 ) {
if ( ! ( j & 31 ) ) {
if ( j )
dprintk ( " \n " ) ;
dprintk ( " 0x%04x " , j ) ;
}
dprintk ( " %02x%02x%02x%02x " ,
buf [ j ] , buf [ j + 1 ] , buf [ j + 2 ] , buf [ j + 3 ] ) ;
}
dprintk ( " \n " ) ;
}
# else
2005-08-11 16:25:26 -04:00
static inline void xs_pktdump ( char * msg , u32 * packet , unsigned int count )
2005-08-11 16:25:23 -04:00
{
/* NOP */
}
# endif
2006-12-05 16:35:11 -05:00
struct sock_xprt {
struct rpc_xprt xprt ;
2006-12-05 16:35:15 -05:00
/*
* Network layer
*/
struct socket * sock ;
struct sock * inet ;
2006-12-05 16:35:19 -05:00
/*
* State of TCP reply receive
*/
__be32 tcp_fraghdr ,
tcp_xid ;
u32 tcp_offset ,
tcp_reclen ;
unsigned long tcp_copied ,
tcp_flags ;
2006-12-05 16:35:26 -05:00
/*
* Connection of transports
*/
2006-12-07 15:48:15 -05:00
struct delayed_work connect_worker ;
2006-12-05 16:35:26 -05:00
unsigned short port ;
2006-12-05 16:35:30 -05:00
/*
* UDP socket buffer size parameters
*/
size_t rcvsize ,
sndsize ;
2006-12-05 16:35:34 -05:00
/*
* Saved socket callback addresses
*/
void ( * old_data_ready ) ( struct sock * , int ) ;
void ( * old_state_change ) ( struct sock * ) ;
void ( * old_write_space ) ( struct sock * ) ;
2006-12-05 16:35:11 -05:00
} ;
2006-12-05 16:35:23 -05:00
/*
* TCP receive state flags
*/
# define TCP_RCV_LAST_FRAG (1UL << 0)
# define TCP_RCV_COPY_FRAGHDR (1UL << 1)
# define TCP_RCV_COPY_XID (1UL << 2)
# define TCP_RCV_COPY_DATA (1UL << 3)
2006-08-22 20:06:18 -04:00
static void xs_format_peer_addresses ( struct rpc_xprt * xprt )
{
struct sockaddr_in * addr = ( struct sockaddr_in * ) & xprt - > addr ;
char * buf ;
buf = kzalloc ( 20 , GFP_KERNEL ) ;
if ( buf ) {
snprintf ( buf , 20 , " %u.%u.%u.%u " ,
NIPQUAD ( addr - > sin_addr . s_addr ) ) ;
}
xprt - > address_strings [ RPC_DISPLAY_ADDR ] = buf ;
buf = kzalloc ( 8 , GFP_KERNEL ) ;
if ( buf ) {
snprintf ( buf , 8 , " %u " ,
ntohs ( addr - > sin_port ) ) ;
}
xprt - > address_strings [ RPC_DISPLAY_PORT ] = buf ;
if ( xprt - > prot = = IPPROTO_UDP )
xprt - > address_strings [ RPC_DISPLAY_PROTO ] = " udp " ;
else
xprt - > address_strings [ RPC_DISPLAY_PROTO ] = " tcp " ;
buf = kzalloc ( 48 , GFP_KERNEL ) ;
if ( buf ) {
snprintf ( buf , 48 , " addr=%u.%u.%u.%u port=%u proto=%s " ,
NIPQUAD ( addr - > sin_addr . s_addr ) ,
ntohs ( addr - > sin_port ) ,
xprt - > prot = = IPPROTO_UDP ? " udp " : " tcp " ) ;
}
xprt - > address_strings [ RPC_DISPLAY_ALL ] = buf ;
}
static void xs_free_peer_addresses ( struct rpc_xprt * xprt )
{
kfree ( xprt - > address_strings [ RPC_DISPLAY_ADDR ] ) ;
kfree ( xprt - > address_strings [ RPC_DISPLAY_PORT ] ) ;
kfree ( xprt - > address_strings [ RPC_DISPLAY_ALL ] ) ;
}
2005-08-11 16:25:29 -04:00
# define XS_SENDMSG_FLAGS (MSG_DONTWAIT | MSG_NOSIGNAL)
2006-10-17 15:06:22 -04:00
static int xs_send_kvec ( struct socket * sock , struct sockaddr * addr , int addrlen , struct kvec * vec , unsigned int base , int more )
2005-08-11 16:25:29 -04:00
{
struct msghdr msg = {
. msg_name = addr ,
. msg_namelen = addrlen ,
2006-10-17 15:06:22 -04:00
. msg_flags = XS_SENDMSG_FLAGS | ( more ? MSG_MORE : 0 ) ,
} ;
struct kvec iov = {
. iov_base = vec - > iov_base + base ,
. iov_len = vec - > iov_len - base ,
2005-08-11 16:25:29 -04:00
} ;
2006-10-17 15:06:22 -04:00
if ( iov . iov_len ! = 0 )
2005-08-11 16:25:29 -04:00
return kernel_sendmsg ( sock , & msg , & iov , 1 , iov . iov_len ) ;
return kernel_sendmsg ( sock , & msg , NULL , 0 , 0 ) ;
}
2006-10-17 15:06:22 -04:00
static int xs_send_pagedata ( struct socket * sock , struct xdr_buf * xdr , unsigned int base , int more )
2005-08-11 16:25:29 -04:00
{
2006-10-17 15:06:22 -04:00
struct page * * ppage ;
unsigned int remainder ;
int err , sent = 0 ;
remainder = xdr - > page_len - base ;
base + = xdr - > page_base ;
ppage = xdr - > pages + ( base > > PAGE_SHIFT ) ;
base & = ~ PAGE_MASK ;
for ( ; ; ) {
unsigned int len = min_t ( unsigned int , PAGE_SIZE - base , remainder ) ;
int flags = XS_SENDMSG_FLAGS ;
2005-08-11 16:25:29 -04:00
2006-10-17 15:06:22 -04:00
remainder - = len ;
if ( remainder ! = 0 | | more )
flags | = MSG_MORE ;
err = sock - > ops - > sendpage ( sock , * ppage , base , len , flags ) ;
if ( remainder = = 0 | | err ! = len )
break ;
sent + = err ;
ppage + + ;
base = 0 ;
}
if ( sent = = 0 )
return err ;
if ( err > 0 )
sent + = err ;
return sent ;
2005-08-11 16:25:29 -04:00
}
2005-08-11 16:25:26 -04:00
/**
* xs_sendpages - write pages directly to a socket
* @ sock : socket to send on
* @ addr : UDP only - - address of destination
* @ addrlen : UDP only - - length of destination address
* @ xdr : buffer containing this request
* @ base : starting position in the buffer
*
2005-08-11 16:25:23 -04:00
*/
2006-10-17 15:06:22 -04:00
static int xs_sendpages ( struct socket * sock , struct sockaddr * addr , int addrlen , struct xdr_buf * xdr , unsigned int base )
2005-08-11 16:25:23 -04:00
{
2006-10-17 15:06:22 -04:00
unsigned int remainder = xdr - > len - base ;
int err , sent = 0 ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:56 -04:00
if ( unlikely ( ! sock ) )
return - ENOTCONN ;
clear_bit ( SOCK_ASYNC_NOSPACE , & sock - > flags ) ;
2006-10-17 15:06:22 -04:00
if ( base ! = 0 ) {
addr = NULL ;
addrlen = 0 ;
}
2005-08-11 16:25:56 -04:00
2006-10-17 15:06:22 -04:00
if ( base < xdr - > head [ 0 ] . iov_len | | addr ! = NULL ) {
unsigned int len = xdr - > head [ 0 ] . iov_len - base ;
remainder - = len ;
err = xs_send_kvec ( sock , addr , addrlen , & xdr - > head [ 0 ] , base , remainder ! = 0 ) ;
if ( remainder = = 0 | | err ! = len )
2005-08-11 16:25:23 -04:00
goto out ;
2006-10-17 15:06:22 -04:00
sent + = err ;
2005-08-11 16:25:23 -04:00
base = 0 ;
} else
2006-10-17 15:06:22 -04:00
base - = xdr - > head [ 0 ] . iov_len ;
2005-08-11 16:25:23 -04:00
2006-10-17 15:06:22 -04:00
if ( base < xdr - > page_len ) {
unsigned int len = xdr - > page_len - base ;
remainder - = len ;
err = xs_send_pagedata ( sock , xdr , base , remainder ! = 0 ) ;
if ( remainder = = 0 | | err ! = len )
2005-08-11 16:25:23 -04:00
goto out ;
2006-10-17 15:06:22 -04:00
sent + = err ;
2005-08-11 16:25:23 -04:00
base = 0 ;
2006-10-17 15:06:22 -04:00
} else
base - = xdr - > page_len ;
if ( base > = xdr - > tail [ 0 ] . iov_len )
return sent ;
err = xs_send_kvec ( sock , NULL , 0 , & xdr - > tail [ 0 ] , base , 0 ) ;
2005-08-11 16:25:23 -04:00
out :
2006-10-17 15:06:22 -04:00
if ( sent = = 0 )
return err ;
if ( err > 0 )
sent + = err ;
return sent ;
2005-08-11 16:25:23 -04:00
}
2005-08-11 16:25:26 -04:00
/**
2005-08-11 16:25:56 -04:00
* xs_nospace - place task on wait queue if transmit was incomplete
* @ task : task to put to sleep
2005-08-11 16:25:26 -04:00
*
2005-08-11 16:25:23 -04:00
*/
2005-08-11 16:25:56 -04:00
static void xs_nospace ( struct rpc_task * task )
2005-08-11 16:25:23 -04:00
{
2005-08-11 16:25:56 -04:00
struct rpc_rqst * req = task - > tk_rqstp ;
struct rpc_xprt * xprt = req - > rq_xprt ;
2006-12-05 16:35:15 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2005-08-11 16:25:23 -04:00
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: %5u xmit incomplete (%u left of %u) \n " ,
2005-08-11 16:25:56 -04:00
task - > tk_pid , req - > rq_slen - req - > rq_bytes_sent ,
req - > rq_slen ) ;
2006-12-05 16:35:15 -05:00
if ( test_bit ( SOCK_ASYNC_NOSPACE , & transport - > sock - > flags ) ) {
2005-08-11 16:25:56 -04:00
/* Protect against races with write_space */
spin_lock_bh ( & xprt - > transport_lock ) ;
/* Don't race with disconnect */
if ( ! xprt_connected ( xprt ) )
task - > tk_status = - ENOTCONN ;
2006-12-05 16:35:15 -05:00
else if ( test_bit ( SOCK_NOSPACE , & transport - > sock - > flags ) )
2005-08-11 16:25:56 -04:00
xprt_wait_for_buffer_space ( task ) ;
spin_unlock_bh ( & xprt - > transport_lock ) ;
} else
/* Keep holding the socket if it is blocked */
rpc_delay ( task , HZ > > 4 ) ;
}
/**
* xs_udp_send_request - write an RPC request to a UDP socket
* @ task : address of RPC task that manages the state of an RPC request
*
* Return values :
* 0 : The request has been sent
* EAGAIN : The socket was blocked , please call again later to
* complete the request
* ENOTCONN : Caller needs to invoke connect logic then call again
* other : Some other error occured , the request was not sent
*/
static int xs_udp_send_request ( struct rpc_task * task )
{
struct rpc_rqst * req = task - > tk_rqstp ;
struct rpc_xprt * xprt = req - > rq_xprt ;
2006-12-05 16:35:15 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2005-08-11 16:25:56 -04:00
struct xdr_buf * xdr = & req - > rq_snd_buf ;
int status ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:26 -04:00
xs_pktdump ( " packet data: " ,
2005-08-11 16:25:23 -04:00
req - > rq_svec - > iov_base ,
req - > rq_svec - > iov_len ) ;
2005-08-11 16:25:56 -04:00
req - > rq_xtime = jiffies ;
2006-12-05 16:35:15 -05:00
status = xs_sendpages ( transport - > sock ,
( struct sockaddr * ) & xprt - > addr ,
xprt - > addrlen , xdr ,
req - > rq_bytes_sent ) ;
2005-08-11 16:25:23 -04:00
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_udp_send_request(%u) = %d \n " ,
2005-08-11 16:25:56 -04:00
xdr - > len - req - > rq_bytes_sent , status ) ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:56 -04:00
if ( likely ( status > = ( int ) req - > rq_slen ) )
return 0 ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:56 -04:00
/* Still some bytes left; set up for a retry later. */
if ( status > 0 )
status = - EAGAIN ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:56 -04:00
switch ( status ) {
case - ENETUNREACH :
case - EPIPE :
2005-08-11 16:25:23 -04:00
case - ECONNREFUSED :
/* When the server has died, an ICMP port unreachable message
2005-08-11 16:25:26 -04:00
* prompts ECONNREFUSED . */
2005-08-11 16:25:23 -04:00
break ;
2005-08-11 16:25:56 -04:00
case - EAGAIN :
xs_nospace ( task ) ;
2005-08-11 16:25:23 -04:00
break ;
default :
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: sendmsg returned unrecognized error %d \n " ,
2005-08-11 16:25:56 -04:00
- status ) ;
2005-08-11 16:25:26 -04:00
break ;
2005-08-11 16:25:23 -04:00
}
2005-08-11 16:25:56 -04:00
return status ;
2005-08-11 16:25:23 -04:00
}
2005-08-25 16:25:49 -07:00
static inline void xs_encode_tcp_record_marker ( struct xdr_buf * buf )
{
u32 reclen = buf - > len - sizeof ( rpc_fraghdr ) ;
rpc_fraghdr * base = buf - > head [ 0 ] . iov_base ;
* base = htonl ( RPC_LAST_STREAM_FRAGMENT | reclen ) ;
}
2005-08-11 16:25:26 -04:00
/**
2005-08-11 16:25:56 -04:00
* xs_tcp_send_request - write an RPC request to a TCP socket
2005-08-11 16:25:26 -04:00
* @ task : address of RPC task that manages the state of an RPC request
*
* Return values :
2005-08-11 16:25:56 -04:00
* 0 : The request has been sent
* EAGAIN : The socket was blocked , please call again later to
* complete the request
* ENOTCONN : Caller needs to invoke connect logic then call again
* other : Some other error occured , the request was not sent
2005-08-11 16:25:26 -04:00
*
* XXX : In the case of soft timeouts , should we eventually give up
2005-08-11 16:25:56 -04:00
* if sendmsg is not able to make progress ?
2005-08-11 16:25:26 -04:00
*/
2005-08-11 16:25:56 -04:00
static int xs_tcp_send_request ( struct rpc_task * task )
2005-08-11 16:25:23 -04:00
{
struct rpc_rqst * req = task - > tk_rqstp ;
struct rpc_xprt * xprt = req - > rq_xprt ;
2006-12-05 16:35:15 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2005-08-11 16:25:56 -04:00
struct xdr_buf * xdr = & req - > rq_snd_buf ;
2005-08-11 16:25:23 -04:00
int status , retry = 0 ;
2005-08-25 16:25:49 -07:00
xs_encode_tcp_record_marker ( & req - > rq_snd_buf ) ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:56 -04:00
xs_pktdump ( " packet data: " ,
req - > rq_svec - > iov_base ,
req - > rq_svec - > iov_len ) ;
2005-08-11 16:25:23 -04:00
/* Continue transmitting the packet/record. We must be careful
* to cope with writespace callbacks arriving _after_ we have
2005-08-11 16:25:56 -04:00
* called sendmsg ( ) . */
2005-08-11 16:25:23 -04:00
while ( 1 ) {
req - > rq_xtime = jiffies ;
2006-12-05 16:35:15 -05:00
status = xs_sendpages ( transport - > sock ,
NULL , 0 , xdr , req - > rq_bytes_sent ) ;
2005-08-11 16:25:23 -04:00
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_tcp_send_request(%u) = %d \n " ,
2005-08-11 16:25:56 -04:00
xdr - > len - req - > rq_bytes_sent , status ) ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:56 -04:00
if ( unlikely ( status < 0 ) )
2005-08-11 16:25:23 -04:00
break ;
2005-08-11 16:25:56 -04:00
/* If we've sent the entire packet, immediately
* reset the count of bytes sent . */
req - > rq_bytes_sent + = status ;
2006-03-20 13:44:17 -05:00
task - > tk_bytes_sent + = status ;
2005-08-11 16:25:56 -04:00
if ( likely ( req - > rq_bytes_sent > = req - > rq_slen ) ) {
req - > rq_bytes_sent = 0 ;
return 0 ;
}
2005-08-11 16:25:23 -04:00
status = - EAGAIN ;
2005-08-11 16:25:56 -04:00
if ( retry + + > XS_SENDMSG_RETRY )
2005-08-11 16:25:23 -04:00
break ;
}
2005-08-11 16:25:56 -04:00
switch ( status ) {
case - EAGAIN :
xs_nospace ( task ) ;
break ;
case - ECONNREFUSED :
case - ECONNRESET :
case - ENOTCONN :
case - EPIPE :
status = - ENOTCONN ;
break ;
default :
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: sendmsg returned unrecognized error %d \n " ,
2005-08-11 16:25:56 -04:00
- status ) ;
2005-08-25 16:25:49 -07:00
xprt_disconnect ( xprt ) ;
2005-08-11 16:25:56 -04:00
break ;
2005-08-11 16:25:23 -04:00
}
2005-08-11 16:25:56 -04:00
2005-08-11 16:25:23 -04:00
return status ;
}
2006-07-27 17:22:50 -04:00
/**
* xs_tcp_release_xprt - clean up after a tcp transmission
* @ xprt : transport
* @ task : rpc task
*
* This cleans up if an error causes us to abort the transmission of a request .
* In this case , the socket may need to be reset in order to avoid confusing
* the server .
*/
static void xs_tcp_release_xprt ( struct rpc_xprt * xprt , struct rpc_task * task )
{
struct rpc_rqst * req ;
if ( task ! = xprt - > snd_task )
return ;
if ( task = = NULL )
goto out_release ;
req = task - > tk_rqstp ;
if ( req - > rq_bytes_sent = = 0 )
goto out_release ;
if ( req - > rq_bytes_sent = = req - > rq_snd_buf . len )
goto out_release ;
set_bit ( XPRT_CLOSE_WAIT , & task - > tk_xprt - > state ) ;
out_release :
xprt_release_xprt ( xprt , task ) ;
}
2005-08-11 16:25:26 -04:00
/**
* xs_close - close a socket
* @ xprt : transport
*
2005-08-25 16:25:55 -07:00
* This is used when all requests are complete ; ie , no DRC state remains
* on the server we want to save .
2005-08-11 16:25:23 -04:00
*/
2005-08-11 16:25:26 -04:00
static void xs_close ( struct rpc_xprt * xprt )
2005-08-11 16:25:23 -04:00
{
2006-12-05 16:35:15 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
struct socket * sock = transport - > sock ;
struct sock * sk = transport - > inet ;
2005-08-11 16:25:23 -04:00
if ( ! sk )
2006-01-03 09:55:55 +01:00
goto clear_close_wait ;
2005-08-11 16:25:23 -04:00
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_close xprt %p \n " , xprt ) ;
2005-08-11 16:25:26 -04:00
2005-08-11 16:25:23 -04:00
write_lock_bh ( & sk - > sk_callback_lock ) ;
2006-12-05 16:35:15 -05:00
transport - > inet = NULL ;
transport - > sock = NULL ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:26 -04:00
sk - > sk_user_data = NULL ;
2006-12-05 16:35:34 -05:00
sk - > sk_data_ready = transport - > old_data_ready ;
sk - > sk_state_change = transport - > old_state_change ;
sk - > sk_write_space = transport - > old_write_space ;
2005-08-11 16:25:23 -04:00
write_unlock_bh ( & sk - > sk_callback_lock ) ;
2005-08-11 16:25:26 -04:00
sk - > sk_no_check = 0 ;
2005-08-11 16:25:23 -04:00
sock_release ( sock ) ;
2006-01-03 09:55:55 +01:00
clear_close_wait :
smp_mb__before_clear_bit ( ) ;
clear_bit ( XPRT_CLOSE_WAIT , & xprt - > state ) ;
smp_mb__after_clear_bit ( ) ;
2005-08-11 16:25:23 -04:00
}
2005-08-11 16:25:26 -04:00
/**
* xs_destroy - prepare to shutdown a transport
* @ xprt : doomed transport
*
*/
static void xs_destroy ( struct rpc_xprt * xprt )
2005-08-11 16:25:23 -04:00
{
2006-12-05 16:35:26 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_destroy xprt %p \n " , xprt ) ;
2005-08-11 16:25:26 -04:00
2007-06-14 18:00:42 -04:00
cancel_rearming_delayed_work ( & transport - > connect_worker ) ;
2005-08-11 16:25:23 -04:00
xprt_disconnect ( xprt ) ;
2005-08-11 16:25:26 -04:00
xs_close ( xprt ) ;
2006-08-22 20:06:18 -04:00
xs_free_peer_addresses ( xprt ) ;
2005-08-11 16:25:23 -04:00
kfree ( xprt - > slot ) ;
2006-10-17 14:44:27 -04:00
kfree ( xprt ) ;
2005-08-11 16:25:23 -04:00
}
2005-08-11 16:25:26 -04:00
static inline struct rpc_xprt * xprt_from_sock ( struct sock * sk )
{
return ( struct rpc_xprt * ) sk - > sk_user_data ;
}
/**
* xs_udp_data_ready - " data ready " callback for UDP sockets
* @ sk : socket with data to read
* @ len : how much data to read
*
2005-08-11 16:25:23 -04:00
*/
2005-08-11 16:25:26 -04:00
static void xs_udp_data_ready ( struct sock * sk , int len )
2005-08-11 16:25:23 -04:00
{
2005-08-11 16:25:26 -04:00
struct rpc_task * task ;
struct rpc_xprt * xprt ;
2005-08-11 16:25:23 -04:00
struct rpc_rqst * rovr ;
2005-08-11 16:25:26 -04:00
struct sk_buff * skb ;
2005-08-11 16:25:23 -04:00
int err , repsize , copied ;
2006-09-26 22:29:38 -07:00
u32 _xid ;
__be32 * xp ;
2005-08-11 16:25:23 -04:00
read_lock ( & sk - > sk_callback_lock ) ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_udp_data_ready... \n " ) ;
2005-08-11 16:25:26 -04:00
if ( ! ( xprt = xprt_from_sock ( sk ) ) )
2005-08-11 16:25:23 -04:00
goto out ;
if ( ( skb = skb_recv_datagram ( sk , 0 , 1 , & err ) ) = = NULL )
goto out ;
if ( xprt - > shutdown )
goto dropit ;
repsize = skb - > len - sizeof ( struct udphdr ) ;
if ( repsize < 4 ) {
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: impossible RPC reply size %d! \n " , repsize ) ;
2005-08-11 16:25:23 -04:00
goto dropit ;
}
/* Copy the XID from the skb... */
xp = skb_header_pointer ( skb , sizeof ( struct udphdr ) ,
sizeof ( _xid ) , & _xid ) ;
if ( xp = = NULL )
goto dropit ;
/* Look up and lock the request corresponding to the given XID */
2005-08-11 16:25:32 -04:00
spin_lock ( & xprt - > transport_lock ) ;
2005-08-11 16:25:23 -04:00
rovr = xprt_lookup_rqst ( xprt , * xp ) ;
if ( ! rovr )
goto out_unlock ;
task = rovr - > rq_task ;
if ( ( copied = rovr - > rq_private_buf . buflen ) > repsize )
copied = repsize ;
/* Suck it into the iovec, verify checksum if not done by hw. */
if ( csum_partial_copy_to_xdr ( & rovr - > rq_private_buf , skb ) )
goto out_unlock ;
/* Something worked... */
dst_confirm ( skb - > dst ) ;
2005-08-25 16:25:52 -07:00
xprt_adjust_cwnd ( task , copied ) ;
xprt_update_rtt ( task ) ;
xprt_complete_rqst ( task , copied ) ;
2005-08-11 16:25:23 -04:00
out_unlock :
2005-08-11 16:25:32 -04:00
spin_unlock ( & xprt - > transport_lock ) ;
2005-08-11 16:25:23 -04:00
dropit :
skb_free_datagram ( sk , skb ) ;
out :
read_unlock ( & sk - > sk_callback_lock ) ;
}
2006-12-05 16:35:44 -05:00
static inline void xs_tcp_read_fraghdr ( struct rpc_xprt * xprt , struct xdr_skb_reader * desc )
2005-08-11 16:25:23 -04:00
{
2006-12-05 16:35:19 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2005-08-11 16:25:23 -04:00
size_t len , used ;
char * p ;
2006-12-05 16:35:19 -05:00
p = ( ( char * ) & transport - > tcp_fraghdr ) + transport - > tcp_offset ;
len = sizeof ( transport - > tcp_fraghdr ) - transport - > tcp_offset ;
2006-12-05 16:35:41 -05:00
used = xdr_skb_read_bits ( desc , p , len ) ;
2006-12-05 16:35:19 -05:00
transport - > tcp_offset + = used ;
2005-08-11 16:25:23 -04:00
if ( used ! = len )
return ;
2005-08-25 16:25:49 -07:00
2006-12-05 16:35:19 -05:00
transport - > tcp_reclen = ntohl ( transport - > tcp_fraghdr ) ;
if ( transport - > tcp_reclen & RPC_LAST_STREAM_FRAGMENT )
2006-12-05 16:35:23 -05:00
transport - > tcp_flags | = TCP_RCV_LAST_FRAG ;
2005-08-11 16:25:23 -04:00
else
2006-12-05 16:35:23 -05:00
transport - > tcp_flags & = ~ TCP_RCV_LAST_FRAG ;
2006-12-05 16:35:19 -05:00
transport - > tcp_reclen & = RPC_FRAGMENT_SIZE_MASK ;
2005-08-25 16:25:49 -07:00
2006-12-05 16:35:23 -05:00
transport - > tcp_flags & = ~ TCP_RCV_COPY_FRAGHDR ;
2006-12-05 16:35:19 -05:00
transport - > tcp_offset = 0 ;
2005-08-25 16:25:49 -07:00
2005-08-11 16:25:23 -04:00
/* Sanity check of the record length */
2006-12-05 16:35:19 -05:00
if ( unlikely ( transport - > tcp_reclen < 4 ) ) {
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: invalid TCP record fragment length \n " ) ;
2005-08-11 16:25:23 -04:00
xprt_disconnect ( xprt ) ;
2005-08-11 16:25:26 -04:00
return ;
2005-08-11 16:25:23 -04:00
}
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: reading TCP record fragment of length %d \n " ,
2006-12-05 16:35:19 -05:00
transport - > tcp_reclen ) ;
2005-08-11 16:25:23 -04:00
}
2006-12-05 16:35:19 -05:00
static void xs_tcp_check_fraghdr ( struct sock_xprt * transport )
2005-08-11 16:25:23 -04:00
{
2006-12-05 16:35:19 -05:00
if ( transport - > tcp_offset = = transport - > tcp_reclen ) {
2006-12-05 16:35:23 -05:00
transport - > tcp_flags | = TCP_RCV_COPY_FRAGHDR ;
2006-12-05 16:35:19 -05:00
transport - > tcp_offset = 0 ;
2006-12-05 16:35:23 -05:00
if ( transport - > tcp_flags & TCP_RCV_LAST_FRAG ) {
transport - > tcp_flags & = ~ TCP_RCV_COPY_DATA ;
transport - > tcp_flags | = TCP_RCV_COPY_XID ;
2006-12-05 16:35:19 -05:00
transport - > tcp_copied = 0 ;
2005-08-11 16:25:23 -04:00
}
}
}
2006-12-05 16:35:44 -05:00
static inline void xs_tcp_read_xid ( struct sock_xprt * transport , struct xdr_skb_reader * desc )
2005-08-11 16:25:23 -04:00
{
size_t len , used ;
char * p ;
2006-12-05 16:35:19 -05:00
len = sizeof ( transport - > tcp_xid ) - transport - > tcp_offset ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: reading XID (%Zu bytes) \n " , len ) ;
2006-12-05 16:35:19 -05:00
p = ( ( char * ) & transport - > tcp_xid ) + transport - > tcp_offset ;
2006-12-05 16:35:41 -05:00
used = xdr_skb_read_bits ( desc , p , len ) ;
2006-12-05 16:35:19 -05:00
transport - > tcp_offset + = used ;
2005-08-11 16:25:23 -04:00
if ( used ! = len )
return ;
2006-12-05 16:35:23 -05:00
transport - > tcp_flags & = ~ TCP_RCV_COPY_XID ;
transport - > tcp_flags | = TCP_RCV_COPY_DATA ;
2006-12-05 16:35:19 -05:00
transport - > tcp_copied = 4 ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: reading reply for XID %08x \n " ,
2006-12-05 16:35:19 -05:00
ntohl ( transport - > tcp_xid ) ) ;
xs_tcp_check_fraghdr ( transport ) ;
2005-08-11 16:25:23 -04:00
}
2006-12-05 16:35:44 -05:00
static inline void xs_tcp_read_request ( struct rpc_xprt * xprt , struct xdr_skb_reader * desc )
2005-08-11 16:25:23 -04:00
{
2006-12-05 16:35:19 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2005-08-11 16:25:23 -04:00
struct rpc_rqst * req ;
struct xdr_buf * rcvbuf ;
size_t len ;
ssize_t r ;
/* Find and lock the request corresponding to this xid */
2005-08-11 16:25:32 -04:00
spin_lock ( & xprt - > transport_lock ) ;
2006-12-05 16:35:19 -05:00
req = xprt_lookup_rqst ( xprt , transport - > tcp_xid ) ;
2005-08-11 16:25:23 -04:00
if ( ! req ) {
2006-12-05 16:35:23 -05:00
transport - > tcp_flags & = ~ TCP_RCV_COPY_DATA ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: XID %08x request not found! \n " ,
2006-12-05 16:35:19 -05:00
ntohl ( transport - > tcp_xid ) ) ;
2005-08-11 16:25:32 -04:00
spin_unlock ( & xprt - > transport_lock ) ;
2005-08-11 16:25:23 -04:00
return ;
}
rcvbuf = & req - > rq_private_buf ;
len = desc - > count ;
2006-12-05 16:35:19 -05:00
if ( len > transport - > tcp_reclen - transport - > tcp_offset ) {
2006-12-05 16:35:44 -05:00
struct xdr_skb_reader my_desc ;
2005-08-11 16:25:23 -04:00
2006-12-05 16:35:19 -05:00
len = transport - > tcp_reclen - transport - > tcp_offset ;
2005-08-11 16:25:23 -04:00
memcpy ( & my_desc , desc , sizeof ( my_desc ) ) ;
my_desc . count = len ;
2006-12-05 16:35:19 -05:00
r = xdr_partial_copy_from_skb ( rcvbuf , transport - > tcp_copied ,
2006-12-05 16:35:41 -05:00
& my_desc , xdr_skb_read_bits ) ;
2005-08-11 16:25:23 -04:00
desc - > count - = r ;
desc - > offset + = r ;
} else
2006-12-05 16:35:19 -05:00
r = xdr_partial_copy_from_skb ( rcvbuf , transport - > tcp_copied ,
2006-12-05 16:35:41 -05:00
desc , xdr_skb_read_bits ) ;
2005-08-11 16:25:23 -04:00
if ( r > 0 ) {
2006-12-05 16:35:19 -05:00
transport - > tcp_copied + = r ;
transport - > tcp_offset + = r ;
2005-08-11 16:25:23 -04:00
}
if ( r ! = len ) {
/* Error when copying to the receive buffer,
* usually because we weren ' t able to allocate
* additional buffer pages . All we can do now
2006-12-05 16:35:23 -05:00
* is turn off TCP_RCV_COPY_DATA , so the request
2005-08-11 16:25:23 -04:00
* will not receive any additional updates ,
* and time out .
* Any remaining data from this record will
* be discarded .
*/
2006-12-05 16:35:23 -05:00
transport - > tcp_flags & = ~ TCP_RCV_COPY_DATA ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: XID %08x truncated request \n " ,
2006-12-05 16:35:19 -05:00
ntohl ( transport - > tcp_xid ) ) ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xprt = %p, tcp_copied = %lu, "
" tcp_offset = %u, tcp_reclen = %u \n " ,
xprt , transport - > tcp_copied ,
transport - > tcp_offset , transport - > tcp_reclen ) ;
2005-08-11 16:25:23 -04:00
goto out ;
}
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: XID %08x read %Zd bytes \n " ,
2006-12-05 16:35:19 -05:00
ntohl ( transport - > tcp_xid ) , r ) ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xprt = %p, tcp_copied = %lu, tcp_offset = %u, "
" tcp_reclen = %u \n " , xprt , transport - > tcp_copied ,
transport - > tcp_offset , transport - > tcp_reclen ) ;
2006-12-05 16:35:19 -05:00
if ( transport - > tcp_copied = = req - > rq_private_buf . buflen )
2006-12-05 16:35:23 -05:00
transport - > tcp_flags & = ~ TCP_RCV_COPY_DATA ;
2006-12-05 16:35:19 -05:00
else if ( transport - > tcp_offset = = transport - > tcp_reclen ) {
2006-12-05 16:35:23 -05:00
if ( transport - > tcp_flags & TCP_RCV_LAST_FRAG )
transport - > tcp_flags & = ~ TCP_RCV_COPY_DATA ;
2005-08-11 16:25:23 -04:00
}
out :
2006-12-05 16:35:23 -05:00
if ( ! ( transport - > tcp_flags & TCP_RCV_COPY_DATA ) )
2006-12-05 16:35:19 -05:00
xprt_complete_rqst ( req - > rq_task , transport - > tcp_copied ) ;
2005-08-11 16:25:32 -04:00
spin_unlock ( & xprt - > transport_lock ) ;
2006-12-05 16:35:19 -05:00
xs_tcp_check_fraghdr ( transport ) ;
2005-08-11 16:25:23 -04:00
}
2006-12-05 16:35:44 -05:00
static inline void xs_tcp_read_discard ( struct sock_xprt * transport , struct xdr_skb_reader * desc )
2005-08-11 16:25:23 -04:00
{
size_t len ;
2006-12-05 16:35:19 -05:00
len = transport - > tcp_reclen - transport - > tcp_offset ;
2005-08-11 16:25:23 -04:00
if ( len > desc - > count )
len = desc - > count ;
desc - > count - = len ;
desc - > offset + = len ;
2006-12-05 16:35:19 -05:00
transport - > tcp_offset + = len ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: discarded %Zu bytes \n " , len ) ;
2006-12-05 16:35:19 -05:00
xs_tcp_check_fraghdr ( transport ) ;
2005-08-11 16:25:23 -04:00
}
2005-08-11 16:25:26 -04:00
static int xs_tcp_data_recv ( read_descriptor_t * rd_desc , struct sk_buff * skb , unsigned int offset , size_t len )
2005-08-11 16:25:23 -04:00
{
struct rpc_xprt * xprt = rd_desc - > arg . data ;
2006-12-05 16:35:19 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2006-12-05 16:35:44 -05:00
struct xdr_skb_reader desc = {
2005-08-11 16:25:23 -04:00
. skb = skb ,
. offset = offset ,
. count = len ,
2005-08-11 16:25:26 -04:00
} ;
2005-08-11 16:25:23 -04:00
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_tcp_data_recv started \n " ) ;
2005-08-11 16:25:23 -04:00
do {
/* Read in a new fragment marker if necessary */
/* Can we ever really expect to get completely empty fragments? */
2006-12-05 16:35:23 -05:00
if ( transport - > tcp_flags & TCP_RCV_COPY_FRAGHDR ) {
2005-08-11 16:25:26 -04:00
xs_tcp_read_fraghdr ( xprt , & desc ) ;
2005-08-11 16:25:23 -04:00
continue ;
}
/* Read in the xid if necessary */
2006-12-05 16:35:23 -05:00
if ( transport - > tcp_flags & TCP_RCV_COPY_XID ) {
2006-12-05 16:35:19 -05:00
xs_tcp_read_xid ( transport , & desc ) ;
2005-08-11 16:25:23 -04:00
continue ;
}
/* Read in the request data */
2006-12-05 16:35:23 -05:00
if ( transport - > tcp_flags & TCP_RCV_COPY_DATA ) {
2005-08-11 16:25:26 -04:00
xs_tcp_read_request ( xprt , & desc ) ;
2005-08-11 16:25:23 -04:00
continue ;
}
/* Skip over any trailing bytes on short reads */
2006-12-05 16:35:19 -05:00
xs_tcp_read_discard ( transport , & desc ) ;
2005-08-11 16:25:23 -04:00
} while ( desc . count ) ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_tcp_data_recv done \n " ) ;
2005-08-11 16:25:23 -04:00
return len - desc . count ;
}
2005-08-11 16:25:26 -04:00
/**
* xs_tcp_data_ready - " data ready " callback for TCP sockets
* @ sk : socket with data to read
* @ bytes : how much data to read
*
*/
static void xs_tcp_data_ready ( struct sock * sk , int bytes )
2005-08-11 16:25:23 -04:00
{
struct rpc_xprt * xprt ;
read_descriptor_t rd_desc ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_tcp_data_ready... \n " ) ;
2005-08-11 16:25:23 -04:00
read_lock ( & sk - > sk_callback_lock ) ;
2005-08-11 16:25:26 -04:00
if ( ! ( xprt = xprt_from_sock ( sk ) ) )
2005-08-11 16:25:23 -04:00
goto out ;
if ( xprt - > shutdown )
goto out ;
2005-08-11 16:25:26 -04:00
/* We use rd_desc to pass struct xprt to xs_tcp_data_recv */
2005-08-11 16:25:23 -04:00
rd_desc . arg . data = xprt ;
rd_desc . count = 65536 ;
2005-08-11 16:25:26 -04:00
tcp_read_sock ( sk , & rd_desc , xs_tcp_data_recv ) ;
2005-08-11 16:25:23 -04:00
out :
read_unlock ( & sk - > sk_callback_lock ) ;
}
2005-08-11 16:25:26 -04:00
/**
* xs_tcp_state_change - callback to handle TCP socket state changes
* @ sk : socket whose state has changed
*
*/
static void xs_tcp_state_change ( struct sock * sk )
2005-08-11 16:25:23 -04:00
{
2005-08-11 16:25:26 -04:00
struct rpc_xprt * xprt ;
2005-08-11 16:25:23 -04:00
read_lock ( & sk - > sk_callback_lock ) ;
if ( ! ( xprt = xprt_from_sock ( sk ) ) )
goto out ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_tcp_state_change client %p... \n " , xprt ) ;
dprintk ( " RPC: state %x conn %d dead %d zapped %d \n " ,
sk - > sk_state , xprt_connected ( xprt ) ,
sock_flag ( sk , SOCK_DEAD ) ,
sock_flag ( sk , SOCK_ZAPPED ) ) ;
2005-08-11 16:25:23 -04:00
switch ( sk - > sk_state ) {
case TCP_ESTABLISHED :
2005-08-11 16:25:32 -04:00
spin_lock_bh ( & xprt - > transport_lock ) ;
2005-08-11 16:25:23 -04:00
if ( ! xprt_test_and_set_connected ( xprt ) ) {
2006-12-05 16:35:19 -05:00
struct sock_xprt * transport = container_of ( xprt ,
struct sock_xprt , xprt ) ;
2005-08-11 16:25:23 -04:00
/* Reset TCP record info */
2006-12-05 16:35:19 -05:00
transport - > tcp_offset = 0 ;
transport - > tcp_reclen = 0 ;
transport - > tcp_copied = 0 ;
2006-12-05 16:35:23 -05:00
transport - > tcp_flags =
TCP_RCV_COPY_FRAGHDR | TCP_RCV_COPY_XID ;
2006-12-05 16:35:19 -05:00
2005-08-25 16:25:55 -07:00
xprt - > reestablish_timeout = XS_TCP_INIT_REEST_TO ;
2005-08-11 16:25:44 -04:00
xprt_wake_pending_tasks ( xprt , 0 ) ;
2005-08-11 16:25:23 -04:00
}
2005-08-11 16:25:32 -04:00
spin_unlock_bh ( & xprt - > transport_lock ) ;
2005-08-11 16:25:23 -04:00
break ;
case TCP_SYN_SENT :
case TCP_SYN_RECV :
break ;
2006-01-03 09:55:55 +01:00
case TCP_CLOSE_WAIT :
/* Try to schedule an autoclose RPC calls */
set_bit ( XPRT_CLOSE_WAIT , & xprt - > state ) ;
if ( test_and_set_bit ( XPRT_LOCKED , & xprt - > state ) = = 0 )
2007-06-14 18:00:42 -04:00
queue_work ( rpciod_workqueue , & xprt - > task_cleanup ) ;
2005-08-11 16:25:23 -04:00
default :
xprt_disconnect ( xprt ) ;
}
out :
read_unlock ( & sk - > sk_callback_lock ) ;
}
2005-08-11 16:25:26 -04:00
/**
2005-08-11 16:25:50 -04:00
* xs_udp_write_space - callback invoked when socket buffer space
* becomes available
2005-08-11 16:25:26 -04:00
* @ sk : socket whose state has changed
*
2005-08-11 16:25:23 -04:00
* Called when more output buffer space is available for this socket .
* We try not to wake our writers until they can make " significant "
2005-08-11 16:25:50 -04:00
* progress , otherwise we ' ll waste resources thrashing kernel_sendmsg
2005-08-11 16:25:23 -04:00
* with a bunch of small requests .
*/
2005-08-11 16:25:50 -04:00
static void xs_udp_write_space ( struct sock * sk )
2005-08-11 16:25:23 -04:00
{
read_lock ( & sk - > sk_callback_lock ) ;
2005-08-11 16:25:50 -04:00
/* from net/core/sock.c:sock_def_write_space */
if ( sock_writeable ( sk ) ) {
struct socket * sock ;
struct rpc_xprt * xprt ;
if ( unlikely ( ! ( sock = sk - > sk_socket ) ) )
2005-08-11 16:25:23 -04:00
goto out ;
2005-08-11 16:25:50 -04:00
if ( unlikely ( ! ( xprt = xprt_from_sock ( sk ) ) ) )
goto out ;
if ( unlikely ( ! test_and_clear_bit ( SOCK_NOSPACE , & sock - > flags ) ) )
2005-08-11 16:25:23 -04:00
goto out ;
2005-08-11 16:25:50 -04:00
xprt_write_space ( xprt ) ;
2005-08-11 16:25:23 -04:00
}
2005-08-11 16:25:50 -04:00
out :
read_unlock ( & sk - > sk_callback_lock ) ;
}
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:50 -04:00
/**
* xs_tcp_write_space - callback invoked when socket buffer space
* becomes available
* @ sk : socket whose state has changed
*
* Called when more output buffer space is available for this socket .
* We try not to wake our writers until they can make " significant "
* progress , otherwise we ' ll waste resources thrashing kernel_sendmsg
* with a bunch of small requests .
*/
static void xs_tcp_write_space ( struct sock * sk )
{
read_lock ( & sk - > sk_callback_lock ) ;
/* from net/core/stream.c:sk_stream_write_space */
if ( sk_stream_wspace ( sk ) > = sk_stream_min_wspace ( sk ) ) {
struct socket * sock ;
struct rpc_xprt * xprt ;
if ( unlikely ( ! ( sock = sk - > sk_socket ) ) )
goto out ;
if ( unlikely ( ! ( xprt = xprt_from_sock ( sk ) ) ) )
goto out ;
if ( unlikely ( ! test_and_clear_bit ( SOCK_NOSPACE , & sock - > flags ) ) )
goto out ;
xprt_write_space ( xprt ) ;
}
out :
2005-08-11 16:25:23 -04:00
read_unlock ( & sk - > sk_callback_lock ) ;
}
2005-08-25 16:25:56 -07:00
static void xs_udp_do_set_buffer_size ( struct rpc_xprt * xprt )
2005-08-11 16:25:23 -04:00
{
2006-12-05 16:35:15 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
struct sock * sk = transport - > inet ;
2005-08-11 16:25:23 -04:00
2006-12-05 16:35:30 -05:00
if ( transport - > rcvsize ) {
2005-08-11 16:25:23 -04:00
sk - > sk_userlocks | = SOCK_RCVBUF_LOCK ;
2006-12-05 16:35:30 -05:00
sk - > sk_rcvbuf = transport - > rcvsize * xprt - > max_reqs * 2 ;
2005-08-11 16:25:23 -04:00
}
2006-12-05 16:35:30 -05:00
if ( transport - > sndsize ) {
2005-08-11 16:25:23 -04:00
sk - > sk_userlocks | = SOCK_SNDBUF_LOCK ;
2006-12-05 16:35:30 -05:00
sk - > sk_sndbuf = transport - > sndsize * xprt - > max_reqs * 2 ;
2005-08-11 16:25:23 -04:00
sk - > sk_write_space ( sk ) ;
}
}
2005-08-25 16:25:49 -07:00
/**
2005-08-25 16:25:56 -07:00
* xs_udp_set_buffer_size - set send and receive limits
2005-08-25 16:25:49 -07:00
* @ xprt : generic transport
2005-08-25 16:25:56 -07:00
* @ sndsize : requested size of send buffer , in bytes
* @ rcvsize : requested size of receive buffer , in bytes
2005-08-25 16:25:49 -07:00
*
2005-08-25 16:25:56 -07:00
* Set socket send and receive buffer size limits .
2005-08-25 16:25:49 -07:00
*/
2005-08-25 16:25:56 -07:00
static void xs_udp_set_buffer_size ( struct rpc_xprt * xprt , size_t sndsize , size_t rcvsize )
2005-08-25 16:25:49 -07:00
{
2006-12-05 16:35:30 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
transport - > sndsize = 0 ;
2005-08-25 16:25:56 -07:00
if ( sndsize )
2006-12-05 16:35:30 -05:00
transport - > sndsize = sndsize + 1024 ;
transport - > rcvsize = 0 ;
2005-08-25 16:25:56 -07:00
if ( rcvsize )
2006-12-05 16:35:30 -05:00
transport - > rcvsize = rcvsize + 1024 ;
2005-08-25 16:25:56 -07:00
xs_udp_do_set_buffer_size ( xprt ) ;
2005-08-25 16:25:49 -07:00
}
2005-08-25 16:25:52 -07:00
/**
* xs_udp_timer - called when a retransmit timeout occurs on a UDP transport
* @ task : task that timed out
*
* Adjust the congestion window after a retransmit timeout has occurred .
*/
static void xs_udp_timer ( struct rpc_task * task )
{
xprt_adjust_cwnd ( task , - ETIMEDOUT ) ;
}
2006-05-25 01:40:49 -04:00
static unsigned short xs_get_random_port ( void )
{
unsigned short range = xprt_max_resvport - xprt_min_resvport ;
unsigned short rand = ( unsigned short ) net_random ( ) % range ;
return rand + xprt_min_resvport ;
}
2006-01-03 09:55:51 +01:00
/**
* xs_set_port - reset the port number in the remote endpoint address
* @ xprt : generic transport
* @ port : new port number
*
*/
static void xs_set_port ( struct rpc_xprt * xprt , unsigned short port )
{
2006-08-22 20:06:19 -04:00
struct sockaddr_in * sap = ( struct sockaddr_in * ) & xprt - > addr ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: setting port for xprt %p to %u \n " , xprt , port ) ;
2006-08-22 20:06:19 -04:00
sap - > sin_port = htons ( port ) ;
2006-01-03 09:55:51 +01:00
}
2006-12-05 16:35:26 -05:00
static int xs_bindresvport ( struct sock_xprt * transport , struct socket * sock )
2005-08-11 16:25:23 -04:00
{
struct sockaddr_in myaddr = {
. sin_family = AF_INET ,
} ;
2005-08-25 16:25:54 -07:00
int err ;
2006-12-05 16:35:26 -05:00
unsigned short port = transport - > port ;
2005-08-11 16:25:23 -04:00
do {
myaddr . sin_port = htons ( port ) ;
2006-08-07 20:58:01 -07:00
err = kernel_bind ( sock , ( struct sockaddr * ) & myaddr ,
2005-08-11 16:25:23 -04:00
sizeof ( myaddr ) ) ;
if ( err = = 0 ) {
2006-12-05 16:35:26 -05:00
transport - > port = port ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_bindresvport bound to port %u \n " ,
2005-08-11 16:25:26 -04:00
port ) ;
2005-08-11 16:25:23 -04:00
return 0 ;
}
2005-08-25 16:25:54 -07:00
if ( port < = xprt_min_resvport )
port = xprt_max_resvport ;
else
port - - ;
2006-12-05 16:35:26 -05:00
} while ( err = = - EADDRINUSE & & port ! = transport - > port ) ;
2005-08-11 16:25:23 -04:00
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: can't bind to reserved port (%d). \n " , - err ) ;
2005-08-11 16:25:23 -04:00
return err ;
}
2006-12-06 20:35:24 -08:00
# ifdef CONFIG_DEBUG_LOCK_ALLOC
static struct lock_class_key xs_key [ 2 ] ;
static struct lock_class_key xs_slock_key [ 2 ] ;
static inline void xs_reclassify_socket ( struct socket * sock )
{
struct sock * sk = sock - > sk ;
BUG_ON ( sk - > sk_lock . owner ! = NULL ) ;
switch ( sk - > sk_family ) {
case AF_INET :
sock_lock_init_class_and_name ( sk , " slock-AF_INET-NFS " ,
& xs_slock_key [ 0 ] , " sk_lock-AF_INET-NFS " , & xs_key [ 0 ] ) ;
break ;
case AF_INET6 :
sock_lock_init_class_and_name ( sk , " slock-AF_INET6-NFS " ,
& xs_slock_key [ 1 ] , " sk_lock-AF_INET6-NFS " , & xs_key [ 1 ] ) ;
break ;
default :
BUG ( ) ;
}
}
# else
static inline void xs_reclassify_socket ( struct socket * sock )
{
}
# endif
2005-08-11 16:25:53 -04:00
/**
* xs_udp_connect_worker - set up a UDP socket
2006-11-22 14:55:48 +00:00
* @ work : RPC transport to connect
2005-08-11 16:25:53 -04:00
*
* Invoked by a work queue tasklet .
*/
2006-11-22 14:55:48 +00:00
static void xs_udp_connect_worker ( struct work_struct * work )
2005-08-11 16:25:23 -04:00
{
2006-12-07 15:48:15 -05:00
struct sock_xprt * transport =
container_of ( work , struct sock_xprt , connect_worker . work ) ;
2006-12-05 16:35:26 -05:00
struct rpc_xprt * xprt = & transport - > xprt ;
2006-12-05 16:35:15 -05:00
struct socket * sock = transport - > sock ;
2005-08-11 16:25:53 -04:00
int err , status = - EIO ;
2005-08-11 16:25:26 -04:00
2006-08-22 20:06:15 -04:00
if ( xprt - > shutdown | | ! xprt_bound ( xprt ) )
2005-08-11 16:25:53 -04:00
goto out ;
2005-08-11 16:25:26 -04:00
2005-08-11 16:25:53 -04:00
/* Start by resetting any existing state */
xs_close ( xprt ) ;
2005-08-11 16:25:26 -04:00
2005-08-11 16:25:53 -04:00
if ( ( err = sock_create_kern ( PF_INET , SOCK_DGRAM , IPPROTO_UDP , & sock ) ) < 0 ) {
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: can't create UDP transport socket (%d). \n " , - err ) ;
2005-08-11 16:25:53 -04:00
goto out ;
}
2006-12-06 20:35:24 -08:00
xs_reclassify_socket ( sock ) ;
2005-08-11 16:25:26 -04:00
2006-12-05 16:35:26 -05:00
if ( xprt - > resvport & & xs_bindresvport ( transport , sock ) < 0 ) {
2005-08-11 16:25:53 -04:00
sock_release ( sock ) ;
goto out ;
}
2005-08-11 16:25:26 -04:00
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: worker connecting xprt %p to address: %s \n " ,
2006-12-05 16:35:37 -05:00
xprt , xprt - > address_strings [ RPC_DISPLAY_ALL ] ) ;
2006-08-22 20:06:18 -04:00
2006-12-05 16:35:15 -05:00
if ( ! transport - > inet ) {
2005-08-11 16:25:53 -04:00
struct sock * sk = sock - > sk ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:53 -04:00
write_lock_bh ( & sk - > sk_callback_lock ) ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:53 -04:00
sk - > sk_user_data = xprt ;
2006-12-05 16:35:34 -05:00
transport - > old_data_ready = sk - > sk_data_ready ;
transport - > old_state_change = sk - > sk_state_change ;
transport - > old_write_space = sk - > sk_write_space ;
2005-08-11 16:25:26 -04:00
sk - > sk_data_ready = xs_udp_data_ready ;
2005-08-11 16:25:50 -04:00
sk - > sk_write_space = xs_udp_write_space ;
2005-08-11 16:25:23 -04:00
sk - > sk_no_check = UDP_CSUM_NORCV ;
2005-12-13 16:13:52 -05:00
sk - > sk_allocation = GFP_ATOMIC ;
2005-08-11 16:25:53 -04:00
2005-08-11 16:25:23 -04:00
xprt_set_connected ( xprt ) ;
2005-08-11 16:25:53 -04:00
/* Reset to new socket */
2006-12-05 16:35:15 -05:00
transport - > sock = sock ;
transport - > inet = sk ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:53 -04:00
write_unlock_bh ( & sk - > sk_callback_lock ) ;
}
2005-08-25 16:25:56 -07:00
xs_udp_do_set_buffer_size ( xprt ) ;
2005-08-11 16:25:53 -04:00
status = 0 ;
out :
xprt_wake_pending_tasks ( xprt , status ) ;
xprt_clear_connecting ( xprt ) ;
2005-08-11 16:25:23 -04:00
}
2005-08-25 16:25:55 -07:00
/*
* We need to preserve the port number so the reply cache on the server can
* find our cached RPC replies when we get around to reconnecting .
*/
static void xs_tcp_reuse_connection ( struct rpc_xprt * xprt )
{
int result ;
2006-12-05 16:35:15 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2005-08-25 16:25:55 -07:00
struct sockaddr any ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: disconnecting xprt %p to reuse port \n " , xprt ) ;
2005-08-25 16:25:55 -07:00
/*
* Disconnect the transport socket by doing a connect operation
* with AF_UNSPEC . This should return immediately . . .
*/
memset ( & any , 0 , sizeof ( any ) ) ;
any . sa_family = AF_UNSPEC ;
2006-12-05 16:35:15 -05:00
result = kernel_connect ( transport - > sock , & any , sizeof ( any ) , 0 ) ;
2005-08-25 16:25:55 -07:00
if ( result )
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: AF_UNSPEC connect return code %d \n " ,
2005-08-25 16:25:55 -07:00
result ) ;
}
2005-08-11 16:25:26 -04:00
/**
2005-08-11 16:25:53 -04:00
* xs_tcp_connect_worker - connect a TCP socket to a remote endpoint
2006-11-22 14:55:48 +00:00
* @ work : RPC transport to connect
2005-08-11 16:25:26 -04:00
*
* Invoked by a work queue tasklet .
2005-08-11 16:25:23 -04:00
*/
2006-11-22 14:55:48 +00:00
static void xs_tcp_connect_worker ( struct work_struct * work )
2005-08-11 16:25:23 -04:00
{
2006-12-07 15:48:15 -05:00
struct sock_xprt * transport =
container_of ( work , struct sock_xprt , connect_worker . work ) ;
2006-12-05 16:35:26 -05:00
struct rpc_xprt * xprt = & transport - > xprt ;
2006-12-05 16:35:15 -05:00
struct socket * sock = transport - > sock ;
2005-08-11 16:25:53 -04:00
int err , status = - EIO ;
2005-08-11 16:25:23 -04:00
2006-08-22 20:06:15 -04:00
if ( xprt - > shutdown | | ! xprt_bound ( xprt ) )
2005-08-11 16:25:23 -04:00
goto out ;
2006-12-05 16:35:15 -05:00
if ( ! sock ) {
2005-08-25 16:25:55 -07:00
/* start from scratch */
if ( ( err = sock_create_kern ( PF_INET , SOCK_STREAM , IPPROTO_TCP , & sock ) ) < 0 ) {
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: can't create TCP transport "
" socket (%d). \n " , - err ) ;
2005-08-25 16:25:55 -07:00
goto out ;
}
2006-12-06 20:35:24 -08:00
xs_reclassify_socket ( sock ) ;
2005-08-11 16:25:23 -04:00
2006-12-05 16:35:26 -05:00
if ( xprt - > resvport & & xs_bindresvport ( transport , sock ) < 0 ) {
2005-08-25 16:25:55 -07:00
sock_release ( sock ) ;
goto out ;
}
} else
/* "close" the socket, preserving the local port */
xs_tcp_reuse_connection ( xprt ) ;
2005-08-11 16:25:23 -04:00
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: worker connecting xprt %p to address: %s \n " ,
2006-12-05 16:35:37 -05:00
xprt , xprt - > address_strings [ RPC_DISPLAY_ALL ] ) ;
2006-08-22 20:06:18 -04:00
2006-12-05 16:35:15 -05:00
if ( ! transport - > inet ) {
2005-08-11 16:25:53 -04:00
struct sock * sk = sock - > sk ;
write_lock_bh ( & sk - > sk_callback_lock ) ;
sk - > sk_user_data = xprt ;
2006-12-05 16:35:34 -05:00
transport - > old_data_ready = sk - > sk_data_ready ;
transport - > old_state_change = sk - > sk_state_change ;
transport - > old_write_space = sk - > sk_write_space ;
2005-08-11 16:25:53 -04:00
sk - > sk_data_ready = xs_tcp_data_ready ;
sk - > sk_state_change = xs_tcp_state_change ;
sk - > sk_write_space = xs_tcp_write_space ;
2005-12-13 16:13:52 -05:00
sk - > sk_allocation = GFP_ATOMIC ;
2005-08-25 16:25:55 -07:00
/* socket options */
sk - > sk_userlocks | = SOCK_BINDPORT_LOCK ;
sock_reset_flag ( sk , SOCK_LINGER ) ;
tcp_sk ( sk ) - > linger2 = 0 ;
tcp_sk ( sk ) - > nonagle | = TCP_NAGLE_OFF ;
2005-08-11 16:25:53 -04:00
xprt_clear_connected ( xprt ) ;
/* Reset to new socket */
2006-12-05 16:35:15 -05:00
transport - > sock = sock ;
transport - > inet = sk ;
2005-08-11 16:25:53 -04:00
write_unlock_bh ( & sk - > sk_callback_lock ) ;
}
/* Tell the socket layer to start connecting... */
2006-03-20 13:44:16 -05:00
xprt - > stat . connect_count + + ;
xprt - > stat . connect_start = jiffies ;
2006-08-07 20:58:01 -07:00
status = kernel_connect ( sock , ( struct sockaddr * ) & xprt - > addr ,
2006-08-22 20:06:19 -04:00
xprt - > addrlen , O_NONBLOCK ) ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: %p connect status %d connected %d sock state %d \n " ,
xprt , - status , xprt_connected ( xprt ) ,
sock - > sk - > sk_state ) ;
2005-08-11 16:25:23 -04:00
if ( status < 0 ) {
switch ( status ) {
case - EINPROGRESS :
case - EALREADY :
goto out_clear ;
2005-08-25 16:25:55 -07:00
case - ECONNREFUSED :
case - ECONNRESET :
/* retry with existing socket, after a delay */
break ;
default :
/* get rid of existing socket, and retry */
xs_close ( xprt ) ;
break ;
2005-08-11 16:25:23 -04:00
}
}
out :
2005-08-11 16:25:44 -04:00
xprt_wake_pending_tasks ( xprt , status ) ;
2005-08-11 16:25:23 -04:00
out_clear :
2005-08-11 16:25:38 -04:00
xprt_clear_connecting ( xprt ) ;
2005-08-11 16:25:23 -04:00
}
2005-08-11 16:25:26 -04:00
/**
* xs_connect - connect a socket to a remote endpoint
* @ task : address of RPC task that manages state of connect request
*
* TCP : If the remote end dropped the connection , delay reconnecting .
2005-08-25 16:25:55 -07:00
*
* UDP socket connects are synchronous , but we use a work queue anyway
* to guarantee that even unprivileged user processes can set up a
* socket on a privileged port .
*
* If a UDP socket connect fails , the delay behavior here prevents
* retry floods ( hard mounts ) .
2005-08-11 16:25:26 -04:00
*/
static void xs_connect ( struct rpc_task * task )
2005-08-11 16:25:23 -04:00
{
struct rpc_xprt * xprt = task - > tk_xprt ;
2006-12-05 16:35:15 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:53 -04:00
if ( xprt_test_and_set_connecting ( xprt ) )
return ;
2006-12-05 16:35:15 -05:00
if ( transport - > sock ! = NULL ) {
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_connect delayed xprt %p for %lu "
" seconds \n " ,
2005-08-25 16:25:55 -07:00
xprt , xprt - > reestablish_timeout / HZ ) ;
2007-06-14 18:00:42 -04:00
queue_delayed_work ( rpciod_workqueue ,
& transport - > connect_worker ,
xprt - > reestablish_timeout ) ;
2005-08-25 16:25:55 -07:00
xprt - > reestablish_timeout < < = 1 ;
if ( xprt - > reestablish_timeout > XS_TCP_MAX_REEST_TO )
xprt - > reestablish_timeout = XS_TCP_MAX_REEST_TO ;
2005-08-11 16:25:53 -04:00
} else {
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_connect scheduled xprt %p \n " , xprt ) ;
2007-06-14 18:00:42 -04:00
queue_delayed_work ( rpciod_workqueue ,
& transport - > connect_worker , 0 ) ;
2005-08-11 16:25:23 -04:00
}
}
2006-03-20 13:44:16 -05:00
/**
* xs_udp_print_stats - display UDP socket - specifc stats
* @ xprt : rpc_xprt struct containing statistics
* @ seq : output file
*
*/
static void xs_udp_print_stats ( struct rpc_xprt * xprt , struct seq_file * seq )
{
2006-12-05 16:35:26 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2006-03-20 13:44:16 -05:00
seq_printf ( seq , " \t xprt: \t udp %u %lu %lu %lu %lu %Lu %Lu \n " ,
2006-12-05 16:35:26 -05:00
transport - > port ,
2006-03-20 13:44:16 -05:00
xprt - > stat . bind_count ,
xprt - > stat . sends ,
xprt - > stat . recvs ,
xprt - > stat . bad_xids ,
xprt - > stat . req_u ,
xprt - > stat . bklog_u ) ;
}
/**
* xs_tcp_print_stats - display TCP socket - specifc stats
* @ xprt : rpc_xprt struct containing statistics
* @ seq : output file
*
*/
static void xs_tcp_print_stats ( struct rpc_xprt * xprt , struct seq_file * seq )
{
2006-12-05 16:35:26 -05:00
struct sock_xprt * transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2006-03-20 13:44:16 -05:00
long idle_time = 0 ;
if ( xprt_connected ( xprt ) )
idle_time = ( long ) ( jiffies - xprt - > last_used ) / HZ ;
seq_printf ( seq , " \t xprt: \t tcp %u %lu %lu %lu %ld %lu %lu %lu %Lu %Lu \n " ,
2006-12-05 16:35:26 -05:00
transport - > port ,
2006-03-20 13:44:16 -05:00
xprt - > stat . bind_count ,
xprt - > stat . connect_count ,
xprt - > stat . connect_time ,
idle_time ,
xprt - > stat . sends ,
xprt - > stat . recvs ,
xprt - > stat . bad_xids ,
xprt - > stat . req_u ,
xprt - > stat . bklog_u ) ;
}
2005-08-11 16:25:56 -04:00
static struct rpc_xprt_ops xs_udp_ops = {
2005-08-25 16:25:49 -07:00
. set_buffer_size = xs_udp_set_buffer_size ,
2005-08-25 16:25:51 -07:00
. reserve_xprt = xprt_reserve_xprt_cong ,
2005-08-25 16:25:51 -07:00
. release_xprt = xprt_release_xprt_cong ,
2007-03-29 16:48:10 -04:00
. rpcbind = rpcb_getport ,
2006-01-03 09:55:51 +01:00
. set_port = xs_set_port ,
2005-08-11 16:25:56 -04:00
. connect = xs_connect ,
2006-01-03 09:55:49 +01:00
. buf_alloc = rpc_malloc ,
. buf_free = rpc_free ,
2005-08-11 16:25:56 -04:00
. send_request = xs_udp_send_request ,
2005-08-25 16:25:50 -07:00
. set_retrans_timeout = xprt_set_retrans_timeout_rtt ,
2005-08-25 16:25:52 -07:00
. timer = xs_udp_timer ,
2005-08-25 16:25:53 -07:00
. release_request = xprt_release_rqst_cong ,
2005-08-11 16:25:56 -04:00
. close = xs_close ,
. destroy = xs_destroy ,
2006-03-20 13:44:16 -05:00
. print_stats = xs_udp_print_stats ,
2005-08-11 16:25:56 -04:00
} ;
static struct rpc_xprt_ops xs_tcp_ops = {
2005-08-25 16:25:51 -07:00
. reserve_xprt = xprt_reserve_xprt ,
2006-07-27 17:22:50 -04:00
. release_xprt = xs_tcp_release_xprt ,
2007-03-29 16:48:10 -04:00
. rpcbind = rpcb_getport ,
2006-01-03 09:55:51 +01:00
. set_port = xs_set_port ,
2005-08-11 16:25:26 -04:00
. connect = xs_connect ,
2006-01-03 09:55:49 +01:00
. buf_alloc = rpc_malloc ,
. buf_free = rpc_free ,
2005-08-11 16:25:56 -04:00
. send_request = xs_tcp_send_request ,
2005-08-25 16:25:50 -07:00
. set_retrans_timeout = xprt_set_retrans_timeout_def ,
2005-08-11 16:25:26 -04:00
. close = xs_close ,
. destroy = xs_destroy ,
2006-03-20 13:44:16 -05:00
. print_stats = xs_tcp_print_stats ,
2005-08-11 16:25:23 -04:00
} ;
2006-10-17 14:44:27 -04:00
static struct rpc_xprt * xs_setup_xprt ( struct sockaddr * addr , size_t addrlen , unsigned int slot_table_size )
{
struct rpc_xprt * xprt ;
2006-12-05 16:35:11 -05:00
struct sock_xprt * new ;
2006-10-17 14:44:27 -04:00
if ( addrlen > sizeof ( xprt - > addr ) ) {
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_setup_xprt: address too large \n " ) ;
2006-10-17 14:44:27 -04:00
return ERR_PTR ( - EBADF ) ;
}
2006-12-05 16:35:11 -05:00
new = kzalloc ( sizeof ( * new ) , GFP_KERNEL ) ;
if ( new = = NULL ) {
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_setup_xprt: couldn't allocate "
" rpc_xprt \n " ) ;
2006-10-17 14:44:27 -04:00
return ERR_PTR ( - ENOMEM ) ;
}
2006-12-05 16:35:11 -05:00
xprt = & new - > xprt ;
2006-10-17 14:44:27 -04:00
xprt - > max_reqs = slot_table_size ;
xprt - > slot = kcalloc ( xprt - > max_reqs , sizeof ( struct rpc_rqst ) , GFP_KERNEL ) ;
if ( xprt - > slot = = NULL ) {
kfree ( xprt ) ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: xs_setup_xprt: couldn't allocate slot "
" table \n " ) ;
2006-10-17 14:44:27 -04:00
return ERR_PTR ( - ENOMEM ) ;
}
memcpy ( & xprt - > addr , addr , addrlen ) ;
xprt - > addrlen = addrlen ;
2006-12-05 16:35:26 -05:00
new - > port = xs_get_random_port ( ) ;
2006-10-17 14:44:27 -04:00
return xprt ;
}
2005-08-11 16:25:26 -04:00
/**
* xs_setup_udp - Set up transport to use a UDP socket
2006-10-17 14:44:27 -04:00
* @ addr : address of remote server
* @ addrlen : length of address in bytes
2005-08-11 16:25:26 -04:00
* @ to : timeout parameters
*
*/
2006-10-17 14:44:27 -04:00
struct rpc_xprt * xs_setup_udp ( struct sockaddr * addr , size_t addrlen , struct rpc_timeout * to )
2005-08-11 16:25:23 -04:00
{
2006-10-17 14:44:27 -04:00
struct rpc_xprt * xprt ;
2006-12-05 16:35:26 -05:00
struct sock_xprt * transport ;
2005-08-11 16:25:23 -04:00
2006-10-17 14:44:27 -04:00
xprt = xs_setup_xprt ( addr , addrlen , xprt_udp_slot_table_entries ) ;
if ( IS_ERR ( xprt ) )
return xprt ;
2006-12-05 16:35:26 -05:00
transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2005-08-11 16:25:23 -04:00
2006-10-17 14:44:27 -04:00
if ( ntohs ( ( ( struct sockaddr_in * ) addr ) - > sin_port ) ! = 0 )
2006-08-22 20:06:15 -04:00
xprt_set_bound ( xprt ) ;
xprt - > prot = IPPROTO_UDP ;
2005-08-25 16:25:49 -07:00
xprt - > tsh_size = 0 ;
2005-08-11 16:25:23 -04:00
/* XXX: header size can vary due to auth type, IPv6, etc. */
xprt - > max_payload = ( 1U < < 16 ) - ( MAX_HEADER < < 3 ) ;
2006-12-07 15:48:15 -05:00
INIT_DELAYED_WORK ( & transport - > connect_worker , xs_udp_connect_worker ) ;
2005-08-25 16:25:55 -07:00
xprt - > bind_timeout = XS_BIND_TO ;
xprt - > connect_timeout = XS_UDP_CONN_TO ;
xprt - > reestablish_timeout = XS_UDP_REEST_TO ;
xprt - > idle_timeout = XS_IDLE_DISC_TO ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:56 -04:00
xprt - > ops = & xs_udp_ops ;
2005-08-11 16:25:23 -04:00
if ( to )
xprt - > timeout = * to ;
else
2005-08-11 16:25:26 -04:00
xprt_set_timeout ( & xprt - > timeout , 5 , 5 * HZ ) ;
2005-08-11 16:25:23 -04:00
2006-08-22 20:06:18 -04:00
xs_format_peer_addresses ( xprt ) ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: set up transport to address %s \n " ,
2006-12-05 16:35:37 -05:00
xprt - > address_strings [ RPC_DISPLAY_ALL ] ) ;
2006-08-22 20:06:18 -04:00
2006-10-17 14:44:27 -04:00
return xprt ;
2005-08-11 16:25:23 -04:00
}
2005-08-11 16:25:26 -04:00
/**
* xs_setup_tcp - Set up transport to use a TCP socket
2006-10-17 14:44:27 -04:00
* @ addr : address of remote server
* @ addrlen : length of address in bytes
2005-08-11 16:25:26 -04:00
* @ to : timeout parameters
*
*/
2006-10-17 14:44:27 -04:00
struct rpc_xprt * xs_setup_tcp ( struct sockaddr * addr , size_t addrlen , struct rpc_timeout * to )
2005-08-11 16:25:23 -04:00
{
2006-10-17 14:44:27 -04:00
struct rpc_xprt * xprt ;
2006-12-05 16:35:26 -05:00
struct sock_xprt * transport ;
2005-08-11 16:25:23 -04:00
2006-10-17 14:44:27 -04:00
xprt = xs_setup_xprt ( addr , addrlen , xprt_tcp_slot_table_entries ) ;
if ( IS_ERR ( xprt ) )
return xprt ;
2006-12-05 16:35:26 -05:00
transport = container_of ( xprt , struct sock_xprt , xprt ) ;
2005-08-11 16:25:23 -04:00
2006-10-17 14:44:27 -04:00
if ( ntohs ( ( ( struct sockaddr_in * ) addr ) - > sin_port ) ! = 0 )
2006-08-22 20:06:15 -04:00
xprt_set_bound ( xprt ) ;
xprt - > prot = IPPROTO_TCP ;
2005-08-25 16:25:49 -07:00
xprt - > tsh_size = sizeof ( rpc_fraghdr ) / sizeof ( u32 ) ;
xprt - > max_payload = RPC_MAX_FRAGMENT_SIZE ;
2005-08-11 16:25:23 -04:00
2006-12-07 15:48:15 -05:00
INIT_DELAYED_WORK ( & transport - > connect_worker , xs_tcp_connect_worker ) ;
2005-08-25 16:25:55 -07:00
xprt - > bind_timeout = XS_BIND_TO ;
xprt - > connect_timeout = XS_TCP_CONN_TO ;
xprt - > reestablish_timeout = XS_TCP_INIT_REEST_TO ;
xprt - > idle_timeout = XS_IDLE_DISC_TO ;
2005-08-11 16:25:23 -04:00
2005-08-11 16:25:56 -04:00
xprt - > ops = & xs_tcp_ops ;
2005-08-11 16:25:23 -04:00
if ( to )
xprt - > timeout = * to ;
else
2005-08-11 16:25:26 -04:00
xprt_set_timeout ( & xprt - > timeout , 2 , 60 * HZ ) ;
2005-08-11 16:25:23 -04:00
2006-08-22 20:06:18 -04:00
xs_format_peer_addresses ( xprt ) ;
2007-01-31 12:14:08 -05:00
dprintk ( " RPC: set up transport to address %s \n " ,
2006-12-05 16:35:37 -05:00
xprt - > address_strings [ RPC_DISPLAY_ALL ] ) ;
2006-08-22 20:06:18 -04:00
2006-10-17 14:44:27 -04:00
return xprt ;
2005-08-11 16:25:23 -04:00
}
2006-12-05 16:35:51 -05:00
/**
2006-12-05 16:35:54 -05:00
* init_socket_xprt - set up xprtsock ' s sysctls
2006-12-05 16:35:51 -05:00
*
*/
int init_socket_xprt ( void )
{
2006-12-05 16:35:54 -05:00
# ifdef RPC_DEBUG
2007-02-14 00:33:24 -08:00
if ( ! sunrpc_table_header )
2007-02-14 00:34:09 -08:00
sunrpc_table_header = register_sysctl_table ( sunrpc_table ) ;
2006-12-05 16:35:54 -05:00
# endif
2006-12-05 16:35:51 -05:00
return 0 ;
}
/**
2006-12-05 16:35:54 -05:00
* cleanup_socket_xprt - remove xprtsock ' s sysctls
2006-12-05 16:35:51 -05:00
*
*/
void cleanup_socket_xprt ( void )
{
2006-12-05 16:35:54 -05:00
# ifdef RPC_DEBUG
if ( sunrpc_table_header ) {
unregister_sysctl_table ( sunrpc_table_header ) ;
sunrpc_table_header = NULL ;
}
# endif
2006-12-05 16:35:51 -05:00
}