2019-05-20 20:08:01 +03:00
// SPDX-License-Identifier: GPL-2.0-or-later
2018-10-20 02:57:57 +03:00
/* Handle vlserver selection and rotation.
 *
 * Copyright (C) 2018 Red Hat, Inc. All Rights Reserved.
 * Written by David Howells (dhowells@redhat.com)
 */
# include <linux/kernel.h>
# include <linux/sched.h>
# include <linux/sched/signal.h>
# include "internal.h"
# include "afs_vl.h"
/*
* Begin an operation on a volume location server .
*/
bool afs_begin_vlserver_operation ( struct afs_vl_cursor * vc , struct afs_cell * cell ,
struct key * key )
{
memset ( vc , 0 , sizeof ( * vc ) ) ;
vc - > cell = cell ;
vc - > key = key ;
vc - > error = - EDESTADDRREQ ;
vc - > ac . error = SHRT_MAX ;
if ( signal_pending ( current ) ) {
vc - > error = - EINTR ;
vc - > flags | = AFS_VL_CURSOR_STOP ;
return false ;
}
return true ;
}
/*
* Begin iteration through a server list , starting with the last used server if
* possible , or the last recorded good server if not .
*/
static bool afs_start_vl_iteration ( struct afs_vl_cursor * vc )
{
struct afs_cell * cell = vc - > cell ;
2019-05-07 17:06:36 +03:00
unsigned int dns_lookup_count ;
2018-10-20 02:57:57 +03:00
2019-05-07 17:06:36 +03:00
if ( cell - > dns_source = = DNS_RECORD_UNAVAILABLE | |
cell - > dns_expiry < = ktime_get_real_seconds ( ) ) {
dns_lookup_count = smp_load_acquire ( & cell - > dns_lookup_count ) ;
set_bit ( AFS_CELL_FL_DO_LOOKUP , & cell - > flags ) ;
2020-10-13 22:51:59 +03:00
afs_queue_cell ( cell , afs_cell_trace_get_queue_dns ) ;
2019-05-07 17:06:36 +03:00
if ( cell - > dns_source = = DNS_RECORD_UNAVAILABLE ) {
if ( wait_var_event_interruptible (
& cell - > dns_lookup_count ,
smp_load_acquire ( & cell - > dns_lookup_count )
! = dns_lookup_count ) < 0 ) {
vc - > error = - ERESTARTSYS ;
return false ;
}
}
/* Status load is ordered after lookup counter load */
if ( cell - > dns_source = = DNS_RECORD_UNAVAILABLE ) {
vc - > error = - EDESTADDRREQ ;
return false ;
}
2018-10-20 02:57:57 +03:00
}
read_lock ( & cell - > vl_servers_lock ) ;
vc - > server_list = afs_get_vlserverlist (
rcu_dereference_protected ( cell - > vl_servers ,
lockdep_is_held ( & cell - > vl_servers_lock ) ) ) ;
read_unlock ( & cell - > vl_servers_lock ) ;
2019-05-07 17:30:34 +03:00
if ( ! vc - > server_list - > nr_servers )
2018-10-20 02:57:57 +03:00
return false ;
2018-10-20 02:57:59 +03:00
vc - > untried = ( 1UL < < vc - > server_list - > nr_servers ) - 1 ;
vc - > index = - 1 ;
2018-10-20 02:57:57 +03:00
return true ;
}
/*
* Select the vlserver to use . May be called multiple times to rotate
* through the vlservers .
*/
bool afs_select_vlserver ( struct afs_vl_cursor * vc )
{
struct afs_addr_list * alist ;
struct afs_vlserver * vlserver ;
2018-11-14 02:20:28 +03:00
struct afs_error e ;
2018-10-20 02:57:59 +03:00
u32 rtt ;
2018-11-14 02:20:28 +03:00
int error = vc - > ac . error , i ;
2018-10-20 02:57:57 +03:00
2018-10-20 02:57:59 +03:00
_enter ( " %lx[%d],%lx[%d],%d,%d " ,
vc - > untried , vc - > index ,
vc - > ac . tried , vc - > ac . index ,
2018-10-20 02:57:57 +03:00
error , vc - > ac . abort_code ) ;
if ( vc - > flags & AFS_VL_CURSOR_STOP ) {
_leave ( " = f [stopped] " ) ;
return false ;
}
2018-10-20 02:57:58 +03:00
vc - > nr_iterations + + ;
2018-10-20 02:57:57 +03:00
/* Evaluate the result of the previous operation, if there was one. */
switch ( error ) {
case SHRT_MAX :
goto start ;
default :
case 0 :
/* Success or local failure. Stop. */
vc - > error = error ;
vc - > flags | = AFS_VL_CURSOR_STOP ;
_leave ( " = f [okay/local %d] " , vc - > ac . error ) ;
return false ;
case - ECONNABORTED :
/* The far side rejected the operation on some grounds. This
* might involve the server being busy or the volume having been moved .
*/
switch ( vc - > ac . abort_code ) {
case AFSVL_IO :
case AFSVL_BADVOLOPER :
case AFSVL_NOMEM :
/* The server went weird. */
vc - > error = - EREMOTEIO ;
//write_lock(&vc->cell->vl_servers_lock);
//vc->server_list->weird_mask |= 1 << vc->index;
//write_unlock(&vc->cell->vl_servers_lock);
goto next_server ;
default :
vc - > error = afs_abort_to_error ( vc - > ac . abort_code ) ;
goto failed ;
}
2018-11-14 02:20:28 +03:00
case - ERFKILL :
case - EADDRNOTAVAIL :
2018-10-20 02:57:57 +03:00
case - ENETUNREACH :
case - EHOSTUNREACH :
2018-11-14 02:20:28 +03:00
case - EHOSTDOWN :
2018-10-20 02:57:57 +03:00
case - ECONNREFUSED :
case - ETIMEDOUT :
case - ETIME :
_debug ( " no conn %d " , error ) ;
vc - > error = error ;
goto iterate_address ;
case - ECONNRESET :
_debug ( " call reset " ) ;
vc - > error = error ;
vc - > flags | = AFS_VL_CURSOR_RETRY ;
goto next_server ;
2020-04-27 17:01:09 +03:00
case - EOPNOTSUPP :
_debug ( " notsupp " ) ;
goto next_server ;
2018-10-20 02:57:57 +03:00
}
restart_from_beginning :
_debug ( " restart " ) ;
afs_end_cursor ( & vc - > ac ) ;
afs_put_vlserverlist ( vc - > cell - > net , vc - > server_list ) ;
vc - > server_list = NULL ;
if ( vc - > flags & AFS_VL_CURSOR_RETRIED )
goto failed ;
vc - > flags | = AFS_VL_CURSOR_RETRIED ;
start :
_debug ( " start " ) ;
if ( ! afs_start_vl_iteration ( vc ) )
goto failed ;
2018-10-20 02:57:59 +03:00
error = afs_send_vl_probes ( vc - > cell - > net , vc - > key , vc - > server_list ) ;
if ( error < 0 )
goto failed_set_error ;
pick_server :
_debug ( " pick [%lx] " , vc - > untried ) ;
error = afs_wait_for_vl_probes ( vc - > server_list , vc - > untried ) ;
if ( error < 0 )
goto failed_set_error ;
/* Pick the untried server with the lowest RTT. */
vc - > index = vc - > server_list - > preferred ;
if ( test_bit ( vc - > index , & vc - > untried ) )
goto selected_server ;
vc - > index = - 1 ;
rtt = U32_MAX ;
for ( i = 0 ; i < vc - > server_list - > nr_servers ; i + + ) {
struct afs_vlserver * s = vc - > server_list - > servers [ i ] . server ;
2020-08-20 17:01:54 +03:00
if ( ! test_bit ( i , & vc - > untried ) | |
2020-08-19 17:27:17 +03:00
! test_bit ( AFS_VLSERVER_FL_RESPONDING , & s - > flags ) )
2018-10-20 02:57:59 +03:00
continue ;
if ( s - > probe . rtt < rtt ) {
vc - > index = i ;
rtt = s - > probe . rtt ;
}
}
if ( vc - > index = = - 1 )
goto no_more_servers ;
selected_server :
_debug ( " use %d " , vc - > index ) ;
__clear_bit ( vc - > index , & vc - > untried ) ;
2018-10-20 02:57:57 +03:00
/* We're starting on a different vlserver from the list. We need to
* check it , find its address list and probe its capabilities before we
* use it .
*/
ASSERTCMP ( vc - > ac . alist , = = , NULL ) ;
vlserver = vc - > server_list - > servers [ vc - > index ] . server ;
2018-10-20 02:57:59 +03:00
vc - > server = vlserver ;
2018-10-20 02:57:57 +03:00
_debug ( " USING VLSERVER: %s " , vlserver - > name ) ;
read_lock ( & vlserver - > lock ) ;
alist = rcu_dereference_protected ( vlserver - > addresses ,
lockdep_is_held ( & vlserver - > lock ) ) ;
afs_get_addrlist ( alist ) ;
read_unlock ( & vlserver - > lock ) ;
memset ( & vc - > ac , 0 , sizeof ( vc - > ac ) ) ;
if ( ! vc - > ac . alist )
vc - > ac . alist = alist ;
else
afs_put_addrlist ( alist ) ;
2018-10-20 02:57:59 +03:00
vc - > ac . index = - 1 ;
2018-10-20 02:57:57 +03:00
iterate_address :
ASSERT ( vc - > ac . alist ) ;
/* Iterate over the current server's address list to try and find an
* address on which it will respond to us .
*/
if ( ! afs_iterate_addresses ( & vc - > ac ) )
goto next_server ;
2018-10-20 02:57:59 +03:00
_debug ( " VL address %d/%d " , vc - > ac . index , vc - > ac . alist - > nr_addrs ) ;
2018-10-20 02:57:59 +03:00
_leave ( " = t %pISpc " , & vc - > ac . alist - > addrs [ vc - > ac . index ] . transport ) ;
2018-10-20 02:57:57 +03:00
return true ;
next_server :
_debug ( " next " ) ;
afs_end_cursor ( & vc - > ac ) ;
2018-10-20 02:57:59 +03:00
goto pick_server ;
2018-10-20 02:57:57 +03:00
2018-10-20 02:57:59 +03:00
no_more_servers :
2018-10-20 02:57:57 +03:00
/* That's all the servers poked to no good effect. Try again if some
* of them were busy .
*/
if ( vc - > flags & AFS_VL_CURSOR_RETRY )
goto restart_from_beginning ;
2018-11-14 02:20:28 +03:00
e . error = - EDESTADDRREQ ;
e . responded = false ;
2018-10-20 02:57:59 +03:00
for ( i = 0 ; i < vc - > server_list - > nr_servers ; i + + ) {
struct afs_vlserver * s = vc - > server_list - > servers [ i ] . server ;
2020-08-20 18:13:05 +03:00
if ( test_bit ( AFS_VLSERVER_FL_RESPONDING , & s - > flags ) )
e . responded = true ;
2018-11-14 02:20:28 +03:00
afs_prioritise_error ( & e , READ_ONCE ( s - > probe . error ) ,
s - > probe . abort_code ) ;
2018-10-20 02:57:59 +03:00
}
2020-08-20 18:13:05 +03:00
error = e . error ;
2018-10-20 02:57:59 +03:00
failed_set_error :
vc - > error = error ;
2018-10-20 02:57:57 +03:00
failed :
vc - > flags | = AFS_VL_CURSOR_STOP ;
afs_end_cursor ( & vc - > ac ) ;
_leave ( " = f [failed %d] " , vc - > error ) ;
return false ;
}
2018-10-20 02:57:58 +03:00
/*
* Dump cursor state in the case of the error being EDESTADDRREQ .
*/
static void afs_vl_dump_edestaddrreq ( const struct afs_vl_cursor * vc )
{
static int count ;
int i ;
if ( ! IS_ENABLED ( CONFIG_AFS_DEBUG_CURSOR ) | | count > 3 )
return ;
count + + ;
rcu_read_lock ( ) ;
pr_notice ( " EDESTADDR occurred \n " ) ;
2018-10-20 02:57:59 +03:00
pr_notice ( " VC: ut=%lx ix=%u ni=%hu fl=%hx err=%hd \n " ,
vc - > untried , vc - > index , vc - > nr_iterations , vc - > flags , vc - > error ) ;
2018-10-20 02:57:58 +03:00
if ( vc - > server_list ) {
const struct afs_vlserver_list * sl = vc - > server_list ;
pr_notice ( " VC: SL nr=%u ix=%u \n " ,
sl - > nr_servers , sl - > index ) ;
for ( i = 0 ; i < sl - > nr_servers ; i + + ) {
const struct afs_vlserver * s = sl - > servers [ i ] . server ;
2018-10-20 02:57:59 +03:00
pr_notice ( " VC: server %s+%hu fl=%lx E=%hd \n " ,
s - > name , s - > port , s - > flags , s - > probe . error ) ;
2018-10-20 02:57:58 +03:00
if ( s - > addresses ) {
const struct afs_addr_list * a =
rcu_dereference ( s - > addresses ) ;
2018-10-20 02:57:59 +03:00
pr_notice ( " VC: - nr=%u/%u/%u pf=%u \n " ,
2018-10-20 02:57:58 +03:00
a - > nr_ipv4 , a - > nr_addrs , a - > max_addrs ,
2018-10-20 02:57:59 +03:00
a - > preferred ) ;
2020-04-24 13:23:17 +03:00
pr_notice ( " VC: - R=%lx F=%lx \n " ,
a - > responded , a - > failed ) ;
2018-10-20 02:57:58 +03:00
if ( a = = vc - > ac . alist )
pr_notice ( " VC: - current \n " ) ;
}
}
}
2018-10-20 02:57:59 +03:00
pr_notice ( " AC: t=%lx ax=%u ac=%d er=%d r=%u ni=%u \n " ,
vc - > ac . tried , vc - > ac . index , vc - > ac . abort_code , vc - > ac . error ,
vc - > ac . responded , vc - > ac . nr_iterations ) ;
2018-10-20 02:57:58 +03:00
rcu_read_unlock ( ) ;
}
2018-10-20 02:57:57 +03:00
/*
* Tidy up a volume location server cursor and unlock the vnode .
*/
int afs_end_vlserver_operation ( struct afs_vl_cursor * vc )
{
struct afs_net * net = vc - > cell - > net ;
2018-10-20 02:57:58 +03:00
if ( vc - > error = = - EDESTADDRREQ | |
2018-11-14 02:20:28 +03:00
vc - > error = = - EADDRNOTAVAIL | |
2018-10-20 02:57:58 +03:00
vc - > error = = - ENETUNREACH | |
vc - > error = = - EHOSTUNREACH )
afs_vl_dump_edestaddrreq ( vc ) ;
2018-10-20 02:57:57 +03:00
afs_end_cursor ( & vc - > ac ) ;
afs_put_vlserverlist ( net , vc - > server_list ) ;
if ( vc - > error = = - ECONNABORTED )
vc - > error = afs_abort_to_error ( vc - > ac . abort_code ) ;
return vc - > error ;
}