2005-08-10 07:14:34 +04:00
# ifndef _CCID_H
# define _CCID_H
/*
 *  net/dccp/ccid.h
 *
 *  An implementation of the DCCP protocol
 *  Arnaldo Carvalho de Melo <acme@conectiva.com.br>
 *
 *  CCID infrastructure
 *
 *  This program is free software; you can redistribute it and/or modify it
 *  under the terms of the GNU General Public License version 2 as
 *  published by the Free Software Foundation.
 */
# include <net/sock.h>
2005-09-18 11:19:32 +04:00
# include <linux/compiler.h>
2005-08-10 07:14:34 +04:00
# include <linux/dccp.h>
# include <linux/list.h>
# include <linux/module.h>
2010-02-01 05:12:19 +03:00
/* maximum value for a CCID (RFC 4340, 19.5) */
# define CCID_MAX 255
/* size in bytes of the ccid_hc_{rx,tx}_slab_name buffers in struct ccid_operations */
# define CCID_SLAB_NAME_LENGTH 32
2005-08-10 07:14:34 +04:00
2005-12-27 07:43:12 +03:00
struct tcp_info ;
2007-12-14 04:31:14 +03:00
/**
* struct ccid_operations - Interface to Congestion - Control Infrastructure
*
* @ ccid_id : numerical CCID ID ( up to % CCID_MAX , cf . table 5 in RFC 4340 , 10. )
2007-12-14 04:37:55 +03:00
* @ ccid_ccmps : the CCMPS including network / transport headers ( 0 when disabled )
2007-12-14 04:31:14 +03:00
* @ ccid_name : alphabetical identifier string for @ ccid_id
* @ ccid_hc_ { r , t } x_slab : memory pool for the receiver / sender half - connection
* @ ccid_hc_ { r , t } x_obj_size : size of the receiver / sender half - connection socket
*
* @ ccid_hc_ { r , t } x_init : CCID - specific initialisation routine ( before startup )
* @ ccid_hc_ { r , t } x_exit : CCID - specific cleanup routine ( before destruction )
* @ ccid_hc_rx_packet_recv : implements the HC - receiver side
* @ ccid_hc_ { r , t } x_parse_options : parsing routine for CCID / HC - specific options
* @ ccid_hc_ { r , t } x_insert_options : insert routine for CCID / HC - specific options
* @ ccid_hc_tx_packet_recv : implements feedback processing for the HC - sender
* @ ccid_hc_tx_send_packet : implements the sending part of the HC - sender
* @ ccid_hc_tx_packet_sent : does accounting for packets in flight by HC - sender
* @ ccid_hc_ { r , t } x_get_info : INET_DIAG information for HC - receiver / sender
* @ ccid_hc_ { r , t } x_getsockopt : socket options specific to HC - receiver / sender
*/
2006-03-21 06:21:44 +03:00
struct ccid_operations {
2007-12-14 04:31:14 +03:00
unsigned char ccid_id ;
2007-12-14 04:37:55 +03:00
__u32 ccid_ccmps ;
2007-12-14 04:31:14 +03:00
const char * ccid_name ;
struct kmem_cache * ccid_hc_rx_slab ,
* ccid_hc_tx_slab ;
2010-02-01 05:12:19 +03:00
char ccid_hc_rx_slab_name [ CCID_SLAB_NAME_LENGTH ] ;
char ccid_hc_tx_slab_name [ CCID_SLAB_NAME_LENGTH ] ;
2007-12-14 04:31:14 +03:00
__u32 ccid_hc_rx_obj_size ,
ccid_hc_tx_obj_size ;
/* Interface Routines */
2006-03-21 06:21:44 +03:00
int ( * ccid_hc_rx_init ) ( struct ccid * ccid , struct sock * sk ) ;
int ( * ccid_hc_tx_init ) ( struct ccid * ccid , struct sock * sk ) ;
2005-08-10 07:14:34 +04:00
void ( * ccid_hc_rx_exit ) ( struct sock * sk ) ;
void ( * ccid_hc_tx_exit ) ( struct sock * sk ) ;
2005-08-14 03:34:54 +04:00
void ( * ccid_hc_rx_packet_recv ) ( struct sock * sk ,
struct sk_buff * skb ) ;
2010-09-19 22:06:50 +04:00
int ( * ccid_hc_rx_parse_options ) ( struct sock * sk , u8 pkt ,
u8 opt , u8 * val , u8 len ) ;
2006-03-21 09:32:06 +03:00
int ( * ccid_hc_rx_insert_options ) ( struct sock * sk ,
2005-08-14 03:34:54 +04:00
struct sk_buff * skb ) ;
void ( * ccid_hc_tx_packet_recv ) ( struct sock * sk ,
struct sk_buff * skb ) ;
2010-09-19 22:06:50 +04:00
int ( * ccid_hc_tx_parse_options ) ( struct sock * sk , u8 pkt ,
u8 opt , u8 * val , u8 len ) ;
2005-08-10 07:14:34 +04:00
int ( * ccid_hc_tx_send_packet ) ( struct sock * sk ,
2006-11-29 00:55:06 +03:00
struct sk_buff * skb ) ;
void ( * ccid_hc_tx_packet_sent ) ( struct sock * sk ,
2010-10-11 22:37:38 +04:00
unsigned int len ) ;
[DCCP]: Introduce dccp_get_info
And also hc_tx and hc_rx get_info functions for the CCIDs to fill in
information that is specific to them.
For now reusing struct tcp_info, later I'll try to figure out a better
solution, for now its really nice to get this kind of info:
[root@qemu ~]# ./ss -danemi
State Recv-Q Send-Q Local Addr:Port Peer Addr:Port
LISTEN 0 0 *:5001 *:* ino:628 sk:c1340040
mem:(r0,w0,f0,t0) cwnd:0 ssthresh:0
ESTAB 0 0 172.20.0.2:5001 172.20.0.1:32785 ino:629 sk:c13409a0
mem:(r0,w0,f0,t0) ts rto:1000 rtt:0.004/0 cwnd:0 ssthresh:0 rcv_rtt:61.377
This, for instance, shows that we're not congestion controlling ACKs,
as the above output is in the ttcp receiving host, and ttcp is a one
way app, i.e. the received never calls sendmsg, so
ccid_hc_tx_send_packet is never called, so the TX half connection
stays in TFRC_SSTATE_NO_SENT state and hctx_rtt is never calculated,
stays with the value set in ccid3_hc_tx_init, 4us, as show above in
milliseconds (0.004ms), upcoming patches will fix this.
rcv_rtt seems sane tho, matching ping results :-)
Signed-off-by: Arnaldo Carvalho de Melo <acme@mandriva.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2005-08-24 08:52:35 +04:00
void ( * ccid_hc_rx_get_info ) ( struct sock * sk ,
struct tcp_info * info ) ;
void ( * ccid_hc_tx_get_info ) ( struct sock * sk ,
struct tcp_info * info ) ;
2005-09-18 11:19:32 +04:00
int ( * ccid_hc_rx_getsockopt ) ( struct sock * sk ,
const int optname , int len ,
u32 __user * optval ,
int __user * optlen ) ;
int ( * ccid_hc_tx_getsockopt ) ( struct sock * sk ,
const int optname , int len ,
u32 __user * optval ,
int __user * optlen ) ;
2005-08-10 07:14:34 +04:00
} ;
2009-01-05 08:42:53 +03:00
/* CCID operation tables; ccid3_ops is only declared with CONFIG_IP_DCCP_CCID3. */
extern struct ccid_operations ccid2_ops;
#ifdef CONFIG_IP_DCCP_CCID3
extern struct ccid_operations ccid3_ops;
#endif

/* Set-up / tear-down of the built-in CCIDs (implemented outside this header). */
int ccid_initialize_builtins(void);
void ccid_cleanup_builtins(void);
2005-08-10 07:14:34 +04:00
2006-03-21 06:21:44 +03:00
/**
 * struct ccid  -  a CCID instance
 *
 * @ccid_ops: operations table of the CCID this instance belongs to
 * @ccid_priv: start of the CCID-private data that trails the structure
 *	       (flexible array member; access it through ccid_priv())
 */
struct ccid {
	struct ccid_operations	*ccid_ops;
	char			ccid_priv[];
};
2005-08-10 07:14:34 +04:00
2006-03-21 06:21:44 +03:00
static inline void * ccid_priv ( const struct ccid * ccid )
2005-08-10 07:14:34 +04:00
{
2006-03-21 06:21:44 +03:00
return ( void * ) ccid - > ccid_priv ;
2005-08-10 07:14:34 +04:00
}
2008-11-12 11:47:26 +03:00
/* CCID lookup / construction helpers implemented outside this header. */
bool ccid_support_check(const u8 *ccid_array, u8 array_len);
int ccid_get_builtin_ccids(u8 **ccid_array, u8 *array_len);
int ccid_getsockopt_builtin_ccids(struct sock *sk, int len,
				  char __user *, int __user *);

struct ccid *ccid_new(const u8 id, struct sock *sk, bool rx);
2006-03-21 06:21:44 +03:00
2008-11-24 03:04:59 +03:00
static inline int ccid_get_current_rx_ccid ( struct dccp_sock * dp )
{
struct ccid * ccid = dp - > dccps_hc_rx_ccid ;
if ( ccid = = NULL | | ccid - > ccid_ops = = NULL )
return - 1 ;
return ccid - > ccid_ops - > ccid_id ;
}
static inline int ccid_get_current_tx_ccid ( struct dccp_sock * dp )
{
struct ccid * ccid = dp - > dccps_hc_tx_ccid ;
if ( ccid = = NULL | | ccid - > ccid_ops = = NULL )
return - 1 ;
return ccid - > ccid_ops - > ccid_id ;
}
2006-03-21 06:21:44 +03:00
/* Destructors for the RX / TX half-connection CCIDs (implemented elsewhere). */
void ccid_hc_rx_delete(struct ccid *ccid, struct sock *sk);
void ccid_hc_tx_delete(struct ccid *ccid, struct sock *sk);
2010-10-27 23:16:25 +04:00
/*
 * Congestion control of queued data packets via CCID decision.
 *
 * The TX CCID performs its congestion-control by indicating whether and when a
 * queued packet may be sent, using the return code of ccid_hc_tx_send_packet().
 * The following modes are supported via the symbolic constants below:
 * - timer-based pacing    (CCID returns a delay value in milliseconds);
 * - autonomous dequeueing (CCID internally schedules dccps_xmitlet).
 */
enum ccid_dequeueing_decision {
	CCID_PACKET_SEND_AT_ONCE	= 0x00000,  /* "green light": no delay */
	CCID_PACKET_DELAY_MAX		= 0x0FFFF,  /* maximum delay in msecs  */
	CCID_PACKET_DELAY		= 0x10000,  /* CCID msec-delay mode    */
	CCID_PACKET_WILL_DEQUEUE_LATER	= 0x20000,  /* CCID autonomous mode    */
	CCID_PACKET_ERR			= 0xF0000,  /* error condition         */
};

/**
 * ccid_packet_dequeue_eval  -  classify a ccid_hc_tx_send_packet() return code
 * @return_code: raw value returned by the TX CCID
 *
 * Maps @return_code onto the ccid_dequeueing_decision constants:
 *   negative                   -> CCID_PACKET_ERR
 *   0                          -> CCID_PACKET_SEND_AT_ONCE
 *   1 .. CCID_PACKET_DELAY_MAX -> CCID_PACKET_DELAY
 * Any larger value is passed through unchanged.
 */
static inline int ccid_packet_dequeue_eval(const int return_code)
{
	if (return_code < 0)
		return CCID_PACKET_ERR;
	if (return_code == 0)
		return CCID_PACKET_SEND_AT_ONCE;
	if (return_code <= CCID_PACKET_DELAY_MAX)
		return CCID_PACKET_DELAY;
	return return_code;
}
2005-08-10 07:14:34 +04:00
static inline int ccid_hc_tx_send_packet ( struct ccid * ccid , struct sock * sk ,
2006-11-29 00:55:06 +03:00
struct sk_buff * skb )
2005-08-10 07:14:34 +04:00
{
2006-03-21 06:21:44 +03:00
if ( ccid - > ccid_ops - > ccid_hc_tx_send_packet ! = NULL )
2010-10-27 23:16:25 +04:00
return ccid - > ccid_ops - > ccid_hc_tx_send_packet ( sk , skb ) ;
return CCID_PACKET_SEND_AT_ONCE ;
2005-08-10 07:14:34 +04:00
}
static inline void ccid_hc_tx_packet_sent ( struct ccid * ccid , struct sock * sk ,
2010-10-11 22:37:38 +04:00
unsigned int len )
2005-08-10 07:14:34 +04:00
{
2006-03-21 06:21:44 +03:00
if ( ccid - > ccid_ops - > ccid_hc_tx_packet_sent ! = NULL )
2010-10-11 22:37:38 +04:00
ccid - > ccid_ops - > ccid_hc_tx_packet_sent ( sk , len ) ;
2005-08-10 07:14:34 +04:00
}
static inline void ccid_hc_rx_packet_recv ( struct ccid * ccid , struct sock * sk ,
struct sk_buff * skb )
{
2006-03-21 06:21:44 +03:00
if ( ccid - > ccid_ops - > ccid_hc_rx_packet_recv ! = NULL )
ccid - > ccid_ops - > ccid_hc_rx_packet_recv ( sk , skb ) ;
2005-08-10 07:14:34 +04:00
}
static inline void ccid_hc_tx_packet_recv ( struct ccid * ccid , struct sock * sk ,
struct sk_buff * skb )
{
2006-03-21 06:21:44 +03:00
if ( ccid - > ccid_ops - > ccid_hc_tx_packet_recv ! = NULL )
ccid - > ccid_ops - > ccid_hc_tx_packet_recv ( sk , skb ) ;
2005-08-10 07:14:34 +04:00
}
2010-09-19 22:06:50 +04:00
/**
* ccid_hc_tx_parse_options - Parse CCID - specific options sent by the receiver
* @ pkt : type of packet that @ opt appears on ( RFC 4340 , 5.1 )
* @ opt : the CCID - specific option type ( RFC 4340 , 5.8 and 10.3 )
* @ val : value of @ opt
* @ len : length of @ val in bytes
*/
2005-08-10 07:14:34 +04:00
static inline int ccid_hc_tx_parse_options ( struct ccid * ccid , struct sock * sk ,
2010-09-19 22:06:50 +04:00
u8 pkt , u8 opt , u8 * val , u8 len )
2005-08-10 07:14:34 +04:00
{
2010-09-19 22:06:50 +04:00
if ( ccid - > ccid_ops - > ccid_hc_tx_parse_options = = NULL )
return 0 ;
return ccid - > ccid_ops - > ccid_hc_tx_parse_options ( sk , pkt , opt , val , len ) ;
2005-08-10 07:14:34 +04:00
}
2010-09-19 22:06:50 +04:00
/**
* ccid_hc_rx_parse_options - Parse CCID - specific options sent by the sender
* Arguments are analogous to ccid_hc_tx_parse_options ( )
*/
2005-08-10 07:14:34 +04:00
static inline int ccid_hc_rx_parse_options ( struct ccid * ccid , struct sock * sk ,
2010-09-19 22:06:50 +04:00
u8 pkt , u8 opt , u8 * val , u8 len )
2005-08-10 07:14:34 +04:00
{
2010-09-19 22:06:50 +04:00
if ( ccid - > ccid_ops - > ccid_hc_rx_parse_options = = NULL )
return 0 ;
return ccid - > ccid_ops - > ccid_hc_rx_parse_options ( sk , pkt , opt , val , len ) ;
2005-08-10 07:14:34 +04:00
}
2006-03-21 09:32:06 +03:00
static inline int ccid_hc_rx_insert_options ( struct ccid * ccid , struct sock * sk ,
struct sk_buff * skb )
2005-08-10 07:14:34 +04:00
{
2006-03-21 06:21:44 +03:00
if ( ccid - > ccid_ops - > ccid_hc_rx_insert_options ! = NULL )
2006-03-21 09:32:06 +03:00
return ccid - > ccid_ops - > ccid_hc_rx_insert_options ( sk , skb ) ;
return 0 ;
2005-08-10 07:14:34 +04:00
}
[DCCP]: Introduce dccp_get_info
And also hc_tx and hc_rx get_info functions for the CCIDs to fill in
information that is specific to them.
For now reusing struct tcp_info, later I'll try to figure out a better
solution, for now it's really nice to get this kind of info:
[root@qemu ~]# ./ss -danemi
State Recv-Q Send-Q Local Addr:Port Peer Addr:Port
LISTEN 0 0 *:5001 *:* ino:628 sk:c1340040
mem:(r0,w0,f0,t0) cwnd:0 ssthresh:0
ESTAB 0 0 172.20.0.2:5001 172.20.0.1:32785 ino:629 sk:c13409a0
mem:(r0,w0,f0,t0) ts rto:1000 rtt:0.004/0 cwnd:0 ssthresh:0 rcv_rtt:61.377
This, for instance, shows that we're not congestion controlling ACKs,
as the above output is in the ttcp receiving host, and ttcp is a one
way app, i.e. the receiver never calls sendmsg, so
ccid_hc_tx_send_packet is never called, so the TX half connection
stays in TFRC_SSTATE_NO_SENT state and hctx_rtt is never calculated,
stays with the value set in ccid3_hc_tx_init, 4us, as shown above in
milliseconds (0.004ms), upcoming patches will fix this.
rcv_rtt seems sane tho, matching ping results :-)
Signed-off-by: Arnaldo Carvalho de Melo <acme@mandriva.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2005-08-24 08:52:35 +04:00
static inline void ccid_hc_rx_get_info ( struct ccid * ccid , struct sock * sk ,
struct tcp_info * info )
{
2006-03-21 06:21:44 +03:00
if ( ccid - > ccid_ops - > ccid_hc_rx_get_info ! = NULL )
ccid - > ccid_ops - > ccid_hc_rx_get_info ( sk , info ) ;
[DCCP]: Introduce dccp_get_info
And also hc_tx and hc_rx get_info functions for the CCIDs to fill in
information that is specific to them.
For now reusing struct tcp_info, later I'll try to figure out a better
solution, for now its really nice to get this kind of info:
[root@qemu ~]# ./ss -danemi
State Recv-Q Send-Q Local Addr:Port Peer Addr:Port
LISTEN 0 0 *:5001 *:* ino:628 sk:c1340040
mem:(r0,w0,f0,t0) cwnd:0 ssthresh:0
ESTAB 0 0 172.20.0.2:5001 172.20.0.1:32785 ino:629 sk:c13409a0
mem:(r0,w0,f0,t0) ts rto:1000 rtt:0.004/0 cwnd:0 ssthresh:0 rcv_rtt:61.377
This, for instance, shows that we're not congestion controlling ACKs,
as the above output is in the ttcp receiving host, and ttcp is a one
way app, i.e. the received never calls sendmsg, so
ccid_hc_tx_send_packet is never called, so the TX half connection
stays in TFRC_SSTATE_NO_SENT state and hctx_rtt is never calculated,
stays with the value set in ccid3_hc_tx_init, 4us, as show above in
milliseconds (0.004ms), upcoming patches will fix this.
rcv_rtt seems sane tho, matching ping results :-)
Signed-off-by: Arnaldo Carvalho de Melo <acme@mandriva.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2005-08-24 08:52:35 +04:00
}
static inline void ccid_hc_tx_get_info ( struct ccid * ccid , struct sock * sk ,
struct tcp_info * info )
{
2006-03-21 06:21:44 +03:00
if ( ccid - > ccid_ops - > ccid_hc_tx_get_info ! = NULL )
ccid - > ccid_ops - > ccid_hc_tx_get_info ( sk , info ) ;
[DCCP]: Introduce dccp_get_info
And also hc_tx and hc_rx get_info functions for the CCIDs to fill in
information that is specific to them.
For now reusing struct tcp_info, later I'll try to figure out a better
solution, for now its really nice to get this kind of info:
[root@qemu ~]# ./ss -danemi
State Recv-Q Send-Q Local Addr:Port Peer Addr:Port
LISTEN 0 0 *:5001 *:* ino:628 sk:c1340040
mem:(r0,w0,f0,t0) cwnd:0 ssthresh:0
ESTAB 0 0 172.20.0.2:5001 172.20.0.1:32785 ino:629 sk:c13409a0
mem:(r0,w0,f0,t0) ts rto:1000 rtt:0.004/0 cwnd:0 ssthresh:0 rcv_rtt:61.377
This, for instance, shows that we're not congestion controlling ACKs,
as the above output is in the ttcp receiving host, and ttcp is a one
way app, i.e. the received never calls sendmsg, so
ccid_hc_tx_send_packet is never called, so the TX half connection
stays in TFRC_SSTATE_NO_SENT state and hctx_rtt is never calculated,
stays with the value set in ccid3_hc_tx_init, 4us, as show above in
milliseconds (0.004ms), upcoming patches will fix this.
rcv_rtt seems sane tho, matching ping results :-)
Signed-off-by: Arnaldo Carvalho de Melo <acme@mandriva.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2005-08-24 08:52:35 +04:00
}
2005-09-18 11:19:32 +04:00
/**
 * ccid_hc_rx_getsockopt  -  forward a getsockopt request to the RX CCID
 * @ccid:    receiver-side CCID instance
 * @sk:      socket being queried
 * @optname: option identifier
 * @len:     length value handed on to the CCID
 * @optval:  user-space buffer for the option value
 * @optlen:  user-space location for the resulting length
 *
 * Returns the result of the CCID's ccid_hc_rx_getsockopt routine, or
 * -ENOPROTOOPT when the CCID does not provide one.
 */
static inline int ccid_hc_rx_getsockopt(struct ccid *ccid, struct sock *sk,
					const int optname, int len,
					u32 __user *optval, int __user *optlen)
{
	int rc = -ENOPROTOOPT;

	if (ccid->ccid_ops->ccid_hc_rx_getsockopt != NULL)
		rc = ccid->ccid_ops->ccid_hc_rx_getsockopt(sk, optname, len,
							   optval, optlen);
	return rc;
}
/**
 * ccid_hc_tx_getsockopt  -  forward a getsockopt request to the TX CCID
 * @ccid:    sender-side CCID instance
 * @sk:      socket being queried
 * @optname: option identifier
 * @len:     length value handed on to the CCID
 * @optval:  user-space buffer for the option value
 * @optlen:  user-space location for the resulting length
 *
 * Returns the result of the CCID's ccid_hc_tx_getsockopt routine, or
 * -ENOPROTOOPT when the CCID does not provide one.
 */
static inline int ccid_hc_tx_getsockopt(struct ccid *ccid, struct sock *sk,
					const int optname, int len,
					u32 __user *optval, int __user *optlen)
{
	int rc = -ENOPROTOOPT;

	if (ccid->ccid_ops->ccid_hc_tx_getsockopt != NULL)
		rc = ccid->ccid_ops->ccid_hc_tx_getsockopt(sk, optname, len,
							   optval, optlen);
	return rc;
}
2005-08-10 07:14:34 +04:00
# endif /* _CCID_H */