2020-03-27 14:48:38 -07:00
// SPDX-License-Identifier: GPL-2.0
/* Multipath TCP
*
* Copyright ( c ) 2019 , Intel Corporation .
*/
2020-04-03 17:14:08 +08:00
# define pr_fmt(fmt) "MPTCP: " fmt
2020-03-27 14:48:38 -07:00
# include <linux/kernel.h>
# include <net/tcp.h>
# include <net/mptcp.h>
# include "protocol.h"
2021-08-13 15:15:46 -07:00
# include "mib.h"
2020-03-27 14:48:38 -07:00
/* path manager command handlers */
int mptcp_pm_announce_addr ( struct mptcp_sock * msk ,
2020-09-24 08:29:50 +08:00
const struct mptcp_addr_info * addr ,
2021-03-26 11:26:31 -07:00
bool echo )
2020-03-27 14:48:38 -07:00
{
2020-12-09 15:51:27 -08:00
u8 add_addr = READ_ONCE ( msk - > pm . addr_signal ) ;
2020-11-19 11:45:59 -08:00
2021-08-23 18:05:40 -07:00
pr_debug ( " msk=%p, local_id=%d, echo=%d " , msk , addr - > id , echo ) ;
2020-03-27 14:48:41 -07:00
2021-02-04 15:23:30 -08:00
lockdep_assert_held ( & msk - > pm . lock ) ;
2021-08-23 18:05:40 -07:00
if ( add_addr &
( echo ? BIT ( MPTCP_ADD_ADDR_ECHO ) : BIT ( MPTCP_ADD_ADDR_SIGNAL ) ) ) {
pr_warn ( " addr_signal error, add_addr=%d, echo=%d " , add_addr , echo ) ;
2020-12-09 15:51:26 -08:00
return - EINVAL ;
}
2021-08-23 18:05:40 -07:00
if ( echo ) {
msk - > pm . remote = * addr ;
2020-11-19 11:45:59 -08:00
add_addr | = BIT ( MPTCP_ADD_ADDR_ECHO ) ;
2021-08-23 18:05:40 -07:00
} else {
msk - > pm . local = * addr ;
add_addr | = BIT ( MPTCP_ADD_ADDR_SIGNAL ) ;
}
2020-12-09 15:51:27 -08:00
WRITE_ONCE ( msk - > pm . addr_signal , add_addr ) ;
2020-03-27 14:48:41 -07:00
return 0 ;
2020-03-27 14:48:38 -07:00
}
2021-03-12 17:16:12 -08:00
int mptcp_pm_remove_addr ( struct mptcp_sock * msk , const struct mptcp_rm_list * rm_list )
2020-03-27 14:48:38 -07:00
{
2020-12-09 15:51:27 -08:00
u8 rm_addr = READ_ONCE ( msk - > pm . addr_signal ) ;
2020-12-09 15:51:26 -08:00
2021-03-12 17:16:12 -08:00
pr_debug ( " msk=%p, rm_list_nr=%d " , msk , rm_list - > nr ) ;
2020-09-24 08:29:54 +08:00
2020-12-09 15:51:26 -08:00
if ( rm_addr ) {
pr_warn ( " addr_signal error, rm_addr=%d " , rm_addr ) ;
return - EINVAL ;
}
2021-03-12 17:16:12 -08:00
msk - > pm . rm_list_tx = * rm_list ;
2020-12-09 15:51:26 -08:00
rm_addr | = BIT ( MPTCP_RM_ADDR_SIGNAL ) ;
2020-12-09 15:51:27 -08:00
WRITE_ONCE ( msk - > pm . addr_signal , rm_addr ) ;
2021-03-26 11:26:41 -07:00
mptcp_pm_nl_addr_send_ack ( msk ) ;
2020-09-24 08:29:54 +08:00
return 0 ;
2020-03-27 14:48:38 -07:00
}
2021-03-12 17:16:16 -08:00
int mptcp_pm_remove_subflow ( struct mptcp_sock * msk , const struct mptcp_rm_list * rm_list )
2020-03-27 14:48:38 -07:00
{
2021-03-12 17:16:16 -08:00
pr_debug ( " msk=%p, rm_list_nr=%d " , msk , rm_list - > nr ) ;
2020-09-24 08:29:55 +08:00
spin_lock_bh ( & msk - > pm . lock ) ;
2021-03-12 17:16:16 -08:00
mptcp_pm_nl_rm_subflow_received ( msk , rm_list ) ;
2020-09-24 08:29:55 +08:00
spin_unlock_bh ( & msk - > pm . lock ) ;
return 0 ;
2020-03-27 14:48:38 -07:00
}
/* path manager event handlers */
2021-02-12 15:59:58 -08:00
void mptcp_pm_new_connection ( struct mptcp_sock * msk , const struct sock * ssk , int server_side )
2020-03-27 14:48:38 -07:00
{
struct mptcp_pm_data * pm = & msk - > pm ;
pr_debug ( " msk=%p, token=%u side=%d " , msk , msk - > token , server_side ) ;
WRITE_ONCE ( pm - > server_side , server_side ) ;
2021-02-12 16:00:01 -08:00
mptcp_event ( MPTCP_EVENT_CREATED , msk , ssk , GFP_ATOMIC ) ;
2020-03-27 14:48:38 -07:00
}
bool mptcp_pm_allow_new_subflow ( struct mptcp_sock * msk )
{
2020-03-27 14:48:41 -07:00
struct mptcp_pm_data * pm = & msk - > pm ;
2021-02-01 15:09:07 -08:00
unsigned int subflows_max ;
2020-09-24 08:29:53 +08:00
int ret = 0 ;
2020-03-27 14:48:41 -07:00
2021-02-01 15:09:07 -08:00
subflows_max = mptcp_pm_get_subflows_max ( msk ) ;
2020-03-27 14:48:41 -07:00
pr_debug ( " msk=%p subflows=%d max=%d allow=%d " , msk , pm - > subflows ,
2021-02-01 15:09:07 -08:00
subflows_max , READ_ONCE ( pm - > accept_subflow ) ) ;
2020-03-27 14:48:41 -07:00
/* try to avoid acquiring the lock below */
if ( ! READ_ONCE ( pm - > accept_subflow ) )
return false ;
spin_lock_bh ( & pm - > lock ) ;
2020-09-24 08:29:53 +08:00
if ( READ_ONCE ( pm - > accept_subflow ) ) {
2021-02-01 15:09:07 -08:00
ret = pm - > subflows < subflows_max ;
if ( ret & & + + pm - > subflows = = subflows_max )
2020-09-24 08:29:53 +08:00
WRITE_ONCE ( pm - > accept_subflow , false ) ;
}
2020-03-27 14:48:41 -07:00
spin_unlock_bh ( & pm - > lock ) ;
return ret ;
}
/* return true if the new status bit is currently cleared, that is, this event
* can be server , eventually by an already scheduled work
*/
static bool mptcp_pm_schedule_work ( struct mptcp_sock * msk ,
enum mptcp_pm_status new_status )
{
pr_debug ( " msk=%p status=%x new=%lx " , msk , msk - > pm . status ,
BIT ( new_status ) ) ;
if ( msk - > pm . status & BIT ( new_status ) )
return false ;
msk - > pm . status | = BIT ( new_status ) ;
2020-11-16 10:48:05 +01:00
mptcp_schedule_work ( ( struct sock * ) msk ) ;
2020-03-27 14:48:41 -07:00
return true ;
2020-03-27 14:48:38 -07:00
}
2021-02-12 15:59:58 -08:00
void mptcp_pm_fully_established ( struct mptcp_sock * msk , const struct sock * ssk , gfp_t gfp )
2020-03-27 14:48:38 -07:00
{
2020-03-27 14:48:41 -07:00
struct mptcp_pm_data * pm = & msk - > pm ;
2021-02-12 16:00:01 -08:00
bool announce = false ;
2020-03-27 14:48:41 -07:00
2020-03-27 14:48:38 -07:00
pr_debug ( " msk=%p " , msk ) ;
2020-03-27 14:48:41 -07:00
spin_lock_bh ( & pm - > lock ) ;
2020-12-09 12:03:29 +01:00
/* mptcp_pm_fully_established() can be invoked by multiple
* racing paths - accept ( ) and check_fully_established ( )
* be sure to serve this event only once .
*/
if ( READ_ONCE ( pm - > work_pending ) & &
! ( msk - > pm . status & BIT ( MPTCP_PM_ALREADY_ESTABLISHED ) ) )
2020-03-27 14:48:41 -07:00
mptcp_pm_schedule_work ( msk , MPTCP_PM_ESTABLISHED ) ;
2021-02-12 16:00:01 -08:00
if ( ( msk - > pm . status & BIT ( MPTCP_PM_ALREADY_ESTABLISHED ) ) = = 0 )
announce = true ;
msk - > pm . status | = BIT ( MPTCP_PM_ALREADY_ESTABLISHED ) ;
2020-03-27 14:48:41 -07:00
spin_unlock_bh ( & pm - > lock ) ;
2021-02-12 16:00:01 -08:00
if ( announce )
mptcp_event ( MPTCP_EVENT_ESTABLISHED , msk , ssk , gfp ) ;
2020-03-27 14:48:38 -07:00
}
void mptcp_pm_connection_closed ( struct mptcp_sock * msk )
{
pr_debug ( " msk=%p " , msk ) ;
}
2021-03-26 11:26:33 -07:00
void mptcp_pm_subflow_established ( struct mptcp_sock * msk )
2020-03-27 14:48:38 -07:00
{
2020-03-27 14:48:41 -07:00
struct mptcp_pm_data * pm = & msk - > pm ;
2020-03-27 14:48:38 -07:00
pr_debug ( " msk=%p " , msk ) ;
2020-03-27 14:48:41 -07:00
if ( ! READ_ONCE ( pm - > work_pending ) )
return ;
spin_lock_bh ( & pm - > lock ) ;
if ( READ_ONCE ( pm - > work_pending ) )
mptcp_pm_schedule_work ( msk , MPTCP_PM_SUBFLOW_ESTABLISHED ) ;
spin_unlock_bh ( & pm - > lock ) ;
2020-03-27 14:48:38 -07:00
}
2022-01-06 16:20:23 -08:00
void mptcp_pm_subflow_check_next ( struct mptcp_sock * msk , const struct sock * ssk ,
const struct mptcp_subflow_context * subflow )
2020-03-27 14:48:38 -07:00
{
2022-01-06 16:20:23 -08:00
struct mptcp_pm_data * pm = & msk - > pm ;
bool update_subflows ;
update_subflows = ( ssk - > sk_state = = TCP_CLOSE ) & &
( subflow - > request_join | | subflow - > mp_join ) ;
if ( ! READ_ONCE ( pm - > work_pending ) & & ! update_subflows )
return ;
spin_lock_bh ( & pm - > lock ) ;
if ( update_subflows )
pm - > subflows - - ;
/* Even if this subflow is not really established, tell the PM to try
* to pick the next ones , if possible .
*/
if ( mptcp_pm_nl_check_work_pending ( msk ) )
mptcp_pm_schedule_work ( msk , MPTCP_PM_SUBFLOW_ESTABLISHED ) ;
spin_unlock_bh ( & pm - > lock ) ;
2020-03-27 14:48:38 -07:00
}
void mptcp_pm_add_addr_received ( struct mptcp_sock * msk ,
const struct mptcp_addr_info * addr )
{
2020-03-27 14:48:41 -07:00
struct mptcp_pm_data * pm = & msk - > pm ;
pr_debug ( " msk=%p remote_id=%d accept=%d " , msk , addr - > id ,
READ_ONCE ( pm - > accept_addr ) ) ;
2021-02-12 16:00:01 -08:00
mptcp_event_addr_announced ( msk , addr ) ;
2020-03-27 14:48:41 -07:00
spin_lock_bh ( & pm - > lock ) ;
2020-11-19 11:46:00 -08:00
if ( ! READ_ONCE ( pm - > accept_addr ) ) {
2021-03-26 11:26:31 -07:00
mptcp_pm_announce_addr ( msk , addr , true ) ;
2020-11-19 11:46:00 -08:00
mptcp_pm_add_addr_send_ack ( msk ) ;
} else if ( mptcp_pm_schedule_work ( msk , MPTCP_PM_ADD_ADDR_RECEIVED ) ) {
2020-03-27 14:48:41 -07:00
pm - > remote = * addr ;
2020-11-19 11:46:00 -08:00
}
2020-03-27 14:48:41 -07:00
spin_unlock_bh ( & pm - > lock ) ;
2020-11-19 11:46:00 -08:00
}
2021-03-26 11:26:38 -07:00
void mptcp_pm_add_addr_echoed ( struct mptcp_sock * msk ,
struct mptcp_addr_info * addr )
{
struct mptcp_pm_data * pm = & msk - > pm ;
pr_debug ( " msk=%p " , msk ) ;
spin_lock_bh ( & pm - > lock ) ;
if ( mptcp_lookup_anno_list_by_saddr ( msk , addr ) & & READ_ONCE ( pm - > work_pending ) )
mptcp_pm_schedule_work ( msk , MPTCP_PM_SUBFLOW_ESTABLISHED ) ;
spin_unlock_bh ( & pm - > lock ) ;
}
2020-11-19 11:46:00 -08:00
void mptcp_pm_add_addr_send_ack ( struct mptcp_sock * msk )
{
2021-02-01 15:09:09 -08:00
if ( ! mptcp_pm_should_add_signal ( msk ) )
2020-11-19 11:46:00 -08:00
return ;
mptcp_pm_schedule_work ( msk , MPTCP_PM_ADD_ADDR_SEND_ACK ) ;
2020-03-27 14:48:38 -07:00
}
2021-03-12 17:16:13 -08:00
void mptcp_pm_rm_addr_received ( struct mptcp_sock * msk ,
const struct mptcp_rm_list * rm_list )
2020-09-24 08:29:49 +08:00
{
struct mptcp_pm_data * pm = & msk - > pm ;
2021-03-12 17:16:13 -08:00
u8 i ;
2020-09-24 08:29:49 +08:00
2021-03-12 17:16:13 -08:00
pr_debug ( " msk=%p remote_ids_nr=%d " , msk , rm_list - > nr ) ;
2020-09-24 08:29:49 +08:00
2021-03-12 17:16:13 -08:00
for ( i = 0 ; i < rm_list - > nr ; i + + )
mptcp_event_addr_removed ( msk , rm_list - > ids [ i ] ) ;
2021-02-12 16:00:01 -08:00
2020-09-24 08:29:49 +08:00
spin_lock_bh ( & pm - > lock ) ;
mptcp_pm_schedule_work ( msk , MPTCP_PM_RM_ADDR_RECEIVED ) ;
2021-03-12 17:16:14 -08:00
pm - > rm_list_rx = * rm_list ;
2020-09-24 08:29:49 +08:00
spin_unlock_bh ( & pm - > lock ) ;
}
2021-01-08 16:47:58 -08:00
void mptcp_pm_mp_prio_received ( struct sock * sk , u8 bkup )
{
struct mptcp_subflow_context * subflow = mptcp_subflow_ctx ( sk ) ;
pr_debug ( " subflow->backup=%d, bkup=%d \n " , subflow - > backup , bkup ) ;
subflow - > backup = bkup ;
2021-02-12 16:00:01 -08:00
mptcp_event ( MPTCP_EVENT_SUB_PRIORITY , mptcp_sk ( subflow - > conn ) , sk , GFP_ATOMIC ) ;
2021-01-08 16:47:58 -08:00
}
2021-08-24 16:26:16 -07:00
void mptcp_pm_mp_fail_received ( struct sock * sk , u64 fail_seq )
{
pr_debug ( " fail_seq=%llu " , fail_seq ) ;
}
2020-03-27 14:48:38 -07:00
/* path manager helpers */
2021-08-23 18:05:39 -07:00
bool mptcp_pm_add_addr_signal ( struct mptcp_sock * msk , struct sk_buff * skb ,
unsigned int opt_size , unsigned int remaining ,
2021-08-23 18:05:42 -07:00
struct mptcp_addr_info * addr , bool * echo ,
2021-08-23 18:05:39 -07:00
bool * port , bool * drop_other_suboptions )
2020-03-27 14:48:38 -07:00
{
2020-03-27 14:48:41 -07:00
int ret = false ;
2021-08-23 18:05:41 -07:00
u8 add_addr ;
2021-08-23 18:05:42 -07:00
u8 family ;
2020-03-27 14:48:41 -07:00
spin_lock_bh ( & msk - > pm . lock ) ;
/* double check after the lock is acquired */
2020-09-24 08:29:47 +08:00
if ( ! mptcp_pm_should_add_signal ( msk ) )
2020-03-27 14:48:41 -07:00
goto out_unlock ;
2021-08-23 18:05:39 -07:00
/* always drop every other options for pure ack ADD_ADDR; this is a
* plain dup - ack from TCP perspective . The other MPTCP - relevant info ,
* if any , will be carried by the ' original ' TCP ack
*/
if ( skb & & skb_is_tcp_pure_ack ( skb ) ) {
remaining + = opt_size ;
* drop_other_suboptions = true ;
}
2020-11-19 11:45:59 -08:00
* echo = mptcp_pm_should_add_signal_echo ( msk ) ;
2021-08-23 18:05:43 -07:00
* port = ! ! ( * echo ? msk - > pm . remote . port : msk - > pm . local . port ) ;
2020-10-03 17:36:56 +02:00
2021-08-23 18:05:42 -07:00
family = * echo ? msk - > pm . remote . family : msk - > pm . local . family ;
if ( remaining < mptcp_add_addr_len ( family , * echo , * port ) )
2020-03-27 14:48:41 -07:00
goto out_unlock ;
2021-08-23 18:05:42 -07:00
if ( * echo ) {
* addr = msk - > pm . remote ;
2021-08-23 18:05:41 -07:00
add_addr = msk - > pm . addr_signal & ~ BIT ( MPTCP_ADD_ADDR_ECHO ) ;
2021-08-23 18:05:42 -07:00
} else {
* addr = msk - > pm . local ;
2021-08-23 18:05:41 -07:00
add_addr = msk - > pm . addr_signal & ~ BIT ( MPTCP_ADD_ADDR_SIGNAL ) ;
2021-08-23 18:05:42 -07:00
}
2021-08-23 18:05:41 -07:00
WRITE_ONCE ( msk - > pm . addr_signal , add_addr ) ;
2020-03-27 14:48:41 -07:00
ret = true ;
out_unlock :
spin_unlock_bh ( & msk - > pm . lock ) ;
return ret ;
2020-03-27 14:48:38 -07:00
}
2020-09-24 08:29:48 +08:00
bool mptcp_pm_rm_addr_signal ( struct mptcp_sock * msk , unsigned int remaining ,
2021-03-12 17:16:11 -08:00
struct mptcp_rm_list * rm_list )
2020-09-24 08:29:48 +08:00
{
2021-03-12 17:16:12 -08:00
int ret = false , len ;
2021-08-23 18:05:41 -07:00
u8 rm_addr ;
2020-09-24 08:29:48 +08:00
spin_lock_bh ( & msk - > pm . lock ) ;
/* double check after the lock is acquired */
if ( ! mptcp_pm_should_rm_signal ( msk ) )
goto out_unlock ;
2021-08-23 18:05:41 -07:00
rm_addr = msk - > pm . addr_signal & ~ BIT ( MPTCP_RM_ADDR_SIGNAL ) ;
2021-03-12 17:16:12 -08:00
len = mptcp_rm_addr_len ( & msk - > pm . rm_list_tx ) ;
if ( len < 0 ) {
2021-08-23 18:05:41 -07:00
WRITE_ONCE ( msk - > pm . addr_signal , rm_addr ) ;
2021-03-12 17:16:12 -08:00
goto out_unlock ;
}
if ( remaining < len )
2020-09-24 08:29:48 +08:00
goto out_unlock ;
2021-03-12 17:16:12 -08:00
* rm_list = msk - > pm . rm_list_tx ;
2021-08-23 18:05:41 -07:00
WRITE_ONCE ( msk - > pm . addr_signal , rm_addr ) ;
2020-09-24 08:29:48 +08:00
ret = true ;
out_unlock :
spin_unlock_bh ( & msk - > pm . lock ) ;
return ret ;
}
2020-03-27 14:48:38 -07:00
int mptcp_pm_get_local_id ( struct mptcp_sock * msk , struct sock_common * skc )
{
2020-03-27 14:48:51 -07:00
return mptcp_pm_nl_get_local_id ( msk , skc ) ;
2020-03-27 14:48:38 -07:00
}
2021-08-13 15:15:42 -07:00
void mptcp_pm_subflow_chk_stale ( const struct mptcp_sock * msk , struct sock * ssk )
{
struct mptcp_subflow_context * subflow = mptcp_subflow_ctx ( ssk ) ;
u32 rcv_tstamp = READ_ONCE ( tcp_sk ( ssk ) - > rcv_tstamp ) ;
/* keep track of rtx periods with no progress */
if ( ! subflow - > stale_count ) {
subflow - > stale_rcv_tstamp = rcv_tstamp ;
subflow - > stale_count + + ;
} else if ( subflow - > stale_rcv_tstamp = = rcv_tstamp ) {
if ( subflow - > stale_count < U8_MAX )
subflow - > stale_count + + ;
2021-08-13 15:15:45 -07:00
mptcp_pm_nl_subflow_chk_stale ( msk , ssk ) ;
2021-08-13 15:15:42 -07:00
} else {
subflow - > stale_count = 0 ;
2021-08-13 15:15:45 -07:00
mptcp_subflow_set_active ( subflow ) ;
2021-08-13 15:15:42 -07:00
}
}
2022-01-06 16:20:16 -08:00
void mptcp_pm_data_reset ( struct mptcp_sock * msk )
2020-03-27 14:48:38 -07:00
{
msk - > pm . add_addr_signaled = 0 ;
msk - > pm . add_addr_accepted = 0 ;
msk - > pm . local_addr_used = 0 ;
msk - > pm . subflows = 0 ;
2021-03-12 17:16:12 -08:00
msk - > pm . rm_list_tx . nr = 0 ;
2021-03-12 17:16:14 -08:00
msk - > pm . rm_list_rx . nr = 0 ;
2020-03-27 14:48:38 -07:00
WRITE_ONCE ( msk - > pm . work_pending , false ) ;
2020-12-09 15:51:27 -08:00
WRITE_ONCE ( msk - > pm . addr_signal , 0 ) ;
2020-03-27 14:48:38 -07:00
WRITE_ONCE ( msk - > pm . accept_addr , false ) ;
WRITE_ONCE ( msk - > pm . accept_subflow , false ) ;
2021-06-22 12:25:20 -07:00
WRITE_ONCE ( msk - > pm . remote_deny_join_id0 , false ) ;
2020-03-27 14:48:38 -07:00
msk - > pm . status = 0 ;
2022-01-06 16:20:22 -08:00
bitmap_fill ( msk - > pm . id_avail_bitmap , MPTCP_PM_MAX_ADDR_ID + 1 ) ;
2020-03-27 14:48:38 -07:00
2022-01-06 16:20:16 -08:00
mptcp_pm_nl_data_init ( msk ) ;
}
void mptcp_pm_data_init ( struct mptcp_sock * msk )
{
2020-03-27 14:48:38 -07:00
spin_lock_init ( & msk - > pm . lock ) ;
2020-09-24 08:29:54 +08:00
INIT_LIST_HEAD ( & msk - > pm . anno_list ) ;
2022-01-06 16:20:16 -08:00
mptcp_pm_data_reset ( msk ) ;
2020-03-27 14:48:38 -07:00
}
2020-06-26 19:29:59 +02:00
void __init mptcp_pm_init ( void )
2020-03-27 14:48:38 -07:00
{
2020-03-27 14:48:51 -07:00
mptcp_pm_nl_init ( ) ;
2020-03-27 14:48:38 -07:00
}