2009-08-21 16:28:31 +04:00
/*
* Copyright ( c ) 2006 Oracle . All rights reserved .
*
* This software is available to you under a choice of one of two
* licenses . You may choose to be licensed under the terms of the GNU
* General Public License ( GPL ) Version 2 , available from the file
* COPYING in the main directory of this source tree , or the
* OpenIB . org BSD license below :
*
* Redistribution and use in source and binary forms , with or
* without modification , are permitted provided that the following
* conditions are met :
*
* - Redistributions of source code must retain the above
* copyright notice , this list of conditions and the following
* disclaimer .
*
* - Redistributions in binary form must reproduce the above
* copyright notice , this list of conditions and the following
* disclaimer in the documentation and / or other materials
* provided with the distribution .
*
* THE SOFTWARE IS PROVIDED " AS IS " , WITHOUT WARRANTY OF ANY KIND ,
* EXPRESS OR IMPLIED , INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
* MERCHANTABILITY , FITNESS FOR A PARTICULAR PURPOSE AND
* NONINFRINGEMENT . IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
* BE LIABLE FOR ANY CLAIM , DAMAGES OR OTHER LIABILITY , WHETHER IN AN
* ACTION OF CONTRACT , TORT OR OTHERWISE , ARISING FROM , OUT OF OR IN
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
* SOFTWARE .
*
*/
# include <linux/kernel.h>
# include <linux/in.h>
# include <net/tcp.h>
2016-06-13 19:44:26 +03:00
# include "rds_single_path.h"
2009-08-21 16:28:31 +04:00
# include "rds.h"
# include "tcp.h"
void rds_tcp_state_change ( struct sock * sk )
{
void ( * state_change ) ( struct sock * sk ) ;
2016-07-01 02:11:14 +03:00
struct rds_conn_path * cp ;
2009-08-21 16:28:31 +04:00
struct rds_tcp_connection * tc ;
2016-05-18 03:44:08 +03:00
read_lock_bh ( & sk - > sk_callback_lock ) ;
2016-07-01 02:11:14 +03:00
cp = sk - > sk_user_data ;
if ( ! cp ) {
2009-08-21 16:28:31 +04:00
state_change = sk - > sk_state_change ;
goto out ;
}
2016-07-01 02:11:14 +03:00
tc = cp - > cp_transport_data ;
2009-08-21 16:28:31 +04:00
state_change = tc - > t_orig_state_change ;
rdsdebug ( " sock %p state_change to %d \n " , tc - > t_sock , sk - > sk_state ) ;
2016-06-18 18:46:31 +03:00
switch ( sk - > sk_state ) {
/* ignore connecting sockets as they make progress */
case TCP_SYN_SENT :
case TCP_SYN_RECV :
break ;
case TCP_ESTABLISHED :
2016-07-01 02:11:14 +03:00
rds_connect_path_complete ( cp , RDS_CONN_CONNECTING ) ;
2016-06-18 18:46:31 +03:00
break ;
case TCP_CLOSE_WAIT :
case TCP_CLOSE :
2016-07-01 02:11:14 +03:00
rds_conn_path_drop ( cp ) ;
2016-06-18 18:46:31 +03:00
default :
break ;
2009-08-21 16:28:31 +04:00
}
out :
2016-05-18 03:44:08 +03:00
read_unlock_bh ( & sk - > sk_callback_lock ) ;
2009-08-21 16:28:31 +04:00
state_change ( sk ) ;
}
int rds_tcp_conn_connect ( struct rds_connection * conn )
{
struct socket * sock = NULL ;
struct sockaddr_in src , dest ;
int ret ;
2016-05-02 21:24:52 +03:00
struct rds_tcp_connection * tc = conn - > c_transport_data ;
2016-07-01 02:11:14 +03:00
struct rds_conn_path * cp = & conn - > c_path [ 0 ] ;
2016-05-02 21:24:52 +03:00
2016-07-01 02:11:12 +03:00
mutex_lock ( & tc - > t_conn_path_lock ) ;
2009-08-21 16:28:31 +04:00
2016-05-02 21:24:52 +03:00
if ( rds_conn_up ( conn ) ) {
2016-07-01 02:11:12 +03:00
mutex_unlock ( & tc - > t_conn_path_lock ) ;
2016-05-02 21:24:52 +03:00
return 0 ;
}
2015-08-05 08:43:25 +03:00
ret = sock_create_kern ( rds_conn_net ( conn ) , PF_INET ,
SOCK_STREAM , IPPROTO_TCP , & sock ) ;
2009-08-21 16:28:31 +04:00
if ( ret < 0 )
goto out ;
rds_tcp_tune ( sock ) ;
src . sin_family = AF_INET ;
src . sin_addr . s_addr = ( __force u32 ) conn - > c_laddr ;
src . sin_port = ( __force u16 ) htons ( 0 ) ;
ret = sock - > ops - > bind ( sock , ( struct sockaddr * ) & src , sizeof ( src ) ) ;
if ( ret ) {
2010-02-02 15:43:59 +03:00
rdsdebug ( " bind failed with %d at address %pI4 \n " ,
ret , & conn - > c_laddr ) ;
2009-08-21 16:28:31 +04:00
goto out ;
}
dest . sin_family = AF_INET ;
dest . sin_addr . s_addr = ( __force u32 ) conn - > c_faddr ;
dest . sin_port = ( __force u16 ) htons ( RDS_TCP_PORT ) ;
/*
* once we call connect ( ) we can start getting callbacks and they
* own the socket
*/
2016-07-01 02:11:14 +03:00
rds_tcp_set_callbacks ( sock , cp ) ;
2009-08-21 16:28:31 +04:00
ret = sock - > ops - > connect ( sock , ( struct sockaddr * ) & dest , sizeof ( dest ) ,
O_NONBLOCK ) ;
2010-02-02 15:43:59 +03:00
rdsdebug ( " connect to address %pI4 returned %d \n " , & conn - > c_faddr , ret ) ;
2009-08-21 16:28:31 +04:00
if ( ret = = - EINPROGRESS )
ret = 0 ;
2015-08-05 08:43:26 +03:00
if ( ret = = 0 ) {
rds_tcp_keepalive ( sock ) ;
2014-10-02 01:49:53 +04:00
sock = NULL ;
2015-08-05 08:43:26 +03:00
} else {
2014-10-02 01:49:53 +04:00
rds_tcp_restore_callbacks ( sock , conn - > c_transport_data ) ;
2015-08-05 08:43:26 +03:00
}
2009-08-21 16:28:31 +04:00
out :
2016-07-01 02:11:12 +03:00
mutex_unlock ( & tc - > t_conn_path_lock ) ;
2009-08-21 16:28:31 +04:00
if ( sock )
sock_release ( sock ) ;
return ret ;
}
/*
* Before killing the tcp socket this needs to serialize with callbacks . The
* caller has already grabbed the sending sem so we ' re serialized with other
* senders .
*
* TCP calls the callbacks with the sock lock so we hold it while we reset the
* callbacks to those set by TCP . Our callbacks won ' t execute again once we
* hold the sock lock .
*/
2016-07-01 02:11:10 +03:00
void rds_tcp_conn_path_shutdown ( struct rds_conn_path * cp )
2009-08-21 16:28:31 +04:00
{
2016-07-01 02:11:10 +03:00
struct rds_tcp_connection * tc = cp - > cp_transport_data ;
2009-08-21 16:28:31 +04:00
struct socket * sock = tc - > t_sock ;
2016-07-01 02:11:10 +03:00
rdsdebug ( " shutting down conn %p tc %p sock %p \n " ,
cp - > cp_conn , tc , sock ) ;
2009-08-21 16:28:31 +04:00
if ( sock ) {
sock - > ops - > shutdown ( sock , RCV_SHUTDOWN | SEND_SHUTDOWN ) ;
lock_sock ( sock - > sk ) ;
rds_tcp_restore_callbacks ( sock , tc ) ; /* tc->tc_sock = NULL */
release_sock ( sock - > sk ) ;
sock_release ( sock ) ;
2010-05-14 14:58:26 +04:00
}
2009-08-21 16:28:31 +04:00
if ( tc - > t_tinc ) {
rds_inc_put ( & tc - > t_tinc - > ti_inc ) ;
tc - > t_tinc = NULL ;
}
tc - > t_tinc_hdr_rem = sizeof ( struct rds_header ) ;
tc - > t_tinc_data_rem = 0 ;
}