2005-04-16 15:20:36 -07:00
# ifndef _NET_NEIGHBOUR_H
# define _NET_NEIGHBOUR_H
2006-08-07 17:57:44 -07:00
# include <linux/neighbour.h>
2005-04-16 15:20:36 -07:00
/*
* Generic neighbour manipulation
*
* Authors :
* Pedro Roque < roque @ di . fc . ul . pt >
* Alexey Kuznetsov < kuznet @ ms2 . inr . ac . ru >
*
* Changes :
*
* Harald Welte : < laforge @ gnumonks . org >
* - Add neighbour cache statistics like rtstat
*/
# include <asm/atomic.h>
# include <linux/netdevice.h>
2005-12-27 02:43:12 -02:00
# include <linux/skbuff.h>
2005-04-16 15:20:36 -07:00
# include <linux/rcupdate.h>
# include <linux/seq_file.h>
# include <linux/err.h>
# include <linux/sysctl.h>
2009-07-30 03:15:07 +00:00
# include <linux/workqueue.h>
2007-03-22 11:50:06 -07:00
# include <net/rtnetlink.h>
2005-04-16 15:20:36 -07:00
2008-01-10 22:37:16 -08:00
/*
* NUD stands for " neighbor unreachability detection "
*/
2005-04-16 15:20:36 -07:00
# define NUD_IN_TIMER (NUD_INCOMPLETE|NUD_REACHABLE|NUD_DELAY|NUD_PROBE)
# define NUD_VALID (NUD_PERMANENT|NUD_NOARP|NUD_REACHABLE|NUD_PROBE|NUD_STALE|NUD_DELAY)
# define NUD_CONNECTED (NUD_PERMANENT|NUD_NOARP|NUD_REACHABLE)
struct neighbour ;
2009-11-03 03:26:03 +00:00
struct neigh_parms {
2008-03-26 03:49:59 +09:00
# ifdef CONFIG_NET_NS
2008-01-24 00:13:18 -08:00
struct net * net ;
2008-03-26 03:49:59 +09:00
# endif
2005-06-18 22:50:55 -07:00
struct net_device * dev ;
2005-04-16 15:20:36 -07:00
struct neigh_parms * next ;
int ( * neigh_setup ) ( struct neighbour * ) ;
2007-03-24 12:52:16 -07:00
void ( * neigh_cleanup ) ( struct neighbour * ) ;
2005-04-16 15:20:36 -07:00
struct neigh_table * tbl ;
void * sysctl_table ;
int dead ;
atomic_t refcnt ;
struct rcu_head rcu_head ;
int base_reachable_time ;
int retrans_time ;
int gc_staletime ;
int reachable_time ;
int delay_probe_time ;
int queue_len ;
int ucast_probes ;
int app_probes ;
int mcast_probes ;
int anycast_delay ;
int proxy_delay ;
int proxy_qlen ;
int locktime ;
} ;
2009-11-03 03:26:03 +00:00
struct neigh_statistics {
2005-04-16 15:20:36 -07:00
unsigned long allocs ; /* number of allocated neighs */
unsigned long destroys ; /* number of destroyed neighs */
unsigned long hash_grows ; /* number of hash resizes */
2008-07-16 20:50:49 -07:00
unsigned long res_failed ; /* number of failed resolutions */
2005-04-16 15:20:36 -07:00
unsigned long lookups ; /* number of lookups */
unsigned long hits ; /* number of hits (among lookups) */
unsigned long rcv_probes_mcast ; /* number of received mcast ipv6 */
unsigned long rcv_probes_ucast ; /* number of received ucast ipv6 */
unsigned long periodic_gc_runs ; /* number of periodic GC runs */
unsigned long forced_gc_runs ; /* number of forced GC runs */
2008-07-16 20:50:49 -07:00
unsigned long unres_discards ; /* number of unresolved drops */
2005-04-16 15:20:36 -07:00
} ;
2009-10-03 19:48:22 +09:00
# define NEIGH_CACHE_STAT_INC(tbl, field) this_cpu_inc((tbl)->stats->field)
2005-04-16 15:20:36 -07:00
2009-11-03 03:26:03 +00:00
struct neighbour {
2010-10-06 17:49:21 -07:00
struct neighbour __rcu * next ;
2005-04-16 15:20:36 -07:00
struct neigh_table * tbl ;
struct neigh_parms * parms ;
unsigned long confirmed ;
unsigned long updated ;
2010-11-11 06:57:19 +00:00
rwlock_t lock ;
2010-09-30 05:36:29 +00:00
atomic_t refcnt ;
neigh: reorder struct neighbour fields
Le mardi 12 octobre 2010 à 00:02 +0200, Eric Dumazet a écrit :
> Here is the followup patch.
>
> Thanks !
>
Oops, this was an old version, the up2date ones also took care of "used"
field.
I guess its time for a sleep, sorry again.
[PATCH net-next V2] neigh: reorder struct neighbour fields
(refcnt) and (ha_lock, ha, used, dev, output, ops, primary_key) should
be placed on a separate cache lines.
refcnt can be often written, while other fields are mostly read.
This gave me good result on stress test :
before:
real 0m45.570s
user 0m15.525s
sys 9m56.669s
After:
real 0m41.841s
user 0m15.261s
sys 8m45.949s
Signed-off-by: Eric Dumazet <eric.dumazet@gmail.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2010-10-11 12:20:54 +00:00
struct sk_buff_head arp_queue ;
struct timer_list timer ;
unsigned long used ;
2005-04-16 15:20:36 -07:00
atomic_t probes ;
2010-11-11 06:57:19 +00:00
__u8 flags ;
__u8 nud_state ;
__u8 type ;
__u8 dead ;
2010-10-07 10:44:07 +00:00
seqlock_t ha_lock ;
2006-08-10 23:03:23 -07:00
unsigned char ha [ ALIGN ( MAX_ADDR_LEN , sizeof ( unsigned long ) ) ] ;
2005-04-16 15:20:36 -07:00
struct hh_cache * hh ;
int ( * output ) ( struct sk_buff * skb ) ;
2009-09-01 11:13:19 +00:00
const struct neigh_ops * ops ;
2010-10-06 17:49:21 -07:00
struct rcu_head rcu ;
neigh: reorder struct neighbour fields
Le mardi 12 octobre 2010 à 00:02 +0200, Eric Dumazet a écrit :
> Here is the followup patch.
>
> Thanks !
>
Oops, this was an old version, the up2date ones also took care of "used"
field.
I guess its time for a sleep, sorry again.
[PATCH net-next V2] neigh: reorder struct neighbour fields
(refcnt) and (ha_lock, ha, used, dev, output, ops, primary_key) should
be placed on a separate cache lines.
refcnt can be often written, while other fields are mostly read.
This gave me good result on stress test :
before:
real 0m45.570s
user 0m15.525s
sys 9m56.669s
After:
real 0m41.841s
user 0m15.261s
sys 8m45.949s
Signed-off-by: Eric Dumazet <eric.dumazet@gmail.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2010-10-11 12:20:54 +00:00
struct net_device * dev ;
2005-04-16 15:20:36 -07:00
u8 primary_key [ 0 ] ;
} ;
2009-11-03 03:26:03 +00:00
struct neigh_ops {
2005-04-16 15:20:36 -07:00
int family ;
void ( * solicit ) ( struct neighbour * , struct sk_buff * ) ;
void ( * error_report ) ( struct neighbour * , struct sk_buff * ) ;
int ( * output ) ( struct sk_buff * ) ;
int ( * connected_output ) ( struct sk_buff * ) ;
int ( * hh_output ) ( struct sk_buff * ) ;
int ( * queue_xmit ) ( struct sk_buff * ) ;
} ;
2009-11-03 03:26:03 +00:00
struct pneigh_entry {
2005-04-16 15:20:36 -07:00
struct pneigh_entry * next ;
2008-03-26 03:49:59 +09:00
# ifdef CONFIG_NET_NS
2008-01-24 00:13:18 -08:00
struct net * net ;
2008-03-26 03:49:59 +09:00
# endif
2008-01-24 00:13:18 -08:00
struct net_device * dev ;
2006-09-22 14:43:19 -07:00
u8 flags ;
2005-04-16 15:20:36 -07:00
u8 key [ 0 ] ;
} ;
/*
* neighbour table manipulation
*/
2010-10-04 06:15:44 +00:00
struct neigh_hash_table {
2010-10-06 17:49:21 -07:00
struct neighbour __rcu * * hash_buckets ;
2010-10-04 06:15:44 +00:00
unsigned int hash_mask ;
__u32 hash_rnd ;
struct rcu_head rcu ;
} ;
2005-04-16 15:20:36 -07:00
2009-11-03 03:26:03 +00:00
struct neigh_table {
2005-04-16 15:20:36 -07:00
struct neigh_table * next ;
int family ;
int entry_size ;
int key_len ;
2010-10-04 06:15:44 +00:00
__u32 ( * hash ) ( const void * pkey ,
const struct net_device * dev ,
__u32 hash_rnd ) ;
2005-04-16 15:20:36 -07:00
int ( * constructor ) ( struct neighbour * ) ;
int ( * pconstructor ) ( struct pneigh_entry * ) ;
void ( * pdestructor ) ( struct pneigh_entry * ) ;
void ( * proxy_redo ) ( struct sk_buff * skb ) ;
char * id ;
struct neigh_parms parms ;
2010-06-30 06:08:15 +00:00
/* HACK. gc_* should follow parms without a gap! */
2005-04-16 15:20:36 -07:00
int gc_interval ;
int gc_thresh1 ;
int gc_thresh2 ;
int gc_thresh3 ;
unsigned long last_flush ;
2009-07-30 03:15:07 +00:00
struct delayed_work gc_work ;
2005-04-16 15:20:36 -07:00
struct timer_list proxy_timer ;
struct sk_buff_head proxy_queue ;
atomic_t entries ;
rwlock_t lock ;
unsigned long last_rand ;
2010-09-30 05:36:29 +00:00
struct kmem_cache * kmem_cachep ;
2010-02-16 15:20:26 +00:00
struct neigh_statistics __percpu * stats ;
2010-10-04 06:15:44 +00:00
struct neigh_hash_table __rcu * nht ;
2005-04-16 15:20:36 -07:00
struct pneigh_entry * * phash_buckets ;
} ;
/* flags for neigh_update() */
# define NEIGH_UPDATE_F_OVERRIDE 0x00000001
# define NEIGH_UPDATE_F_WEAK_OVERRIDE 0x00000002
# define NEIGH_UPDATE_F_OVERRIDE_ISROUTER 0x00000004
# define NEIGH_UPDATE_F_ISROUTER 0x40000000
# define NEIGH_UPDATE_F_ADMIN 0x80000000
extern void neigh_table_init ( struct neigh_table * tbl ) ;
[NEIGH]: Fix IP-over-ATM and ARP interaction.
The classical IP over ATM code maintains its own IPv4 <-> <ATM stuff>
ARP table, using the standard neighbour-table code. The
neigh_table_init function adds this neighbour table to a linked list
of all neighbor tables which is used by the functions neigh_delete()
neigh_add() and neightbl_set(), all called by the netlink code.
Once the ATM neighbour table is added to the list, there are two
tables with family == AF_INET there, and ARP entries sent via netlink
go into the first table with matching family. This is indeterminate
and often wrong.
To see the bug, on a kernel with CLIP enabled, create a standard IPv4
ARP entry by pinging an unused address on a local subnet. Then attempt
to complete that entry by doing
ip neigh replace <ip address> lladdr <some mac address> nud reachable
Looking at the ARP tables by using
ip neigh show
will reveal two ARP entries for the same address. One of these can be
found in /proc/net/arp, and the other in /proc/net/atm/arp.
This patch adds a new function, neigh_table_init_no_netlink() which
does everything the neigh_table_init() does, except add the table to
the netlink all-arp-tables chain. In addition neigh_table_init() has a
check that all tables on the chain have a distinct address family.
The init call in clip.c is changed to call
neigh_table_init_no_netlink().
Since ATM ARP tables are rather more complicated than can currently be
handled by the available rtattrs in the netlink protocol, no
functionality is lost by this patch, and non-ATM ARP manipulation via
netlink is rescued. A more complete solution would involve a rtattr
for ATM ARP entries and some way for the netlink code to give
neigh_add and friends more information than just address family with
which to find the correct ARP table.
[ I've changed the assertion checking in neigh_table_init() to not
use BUG_ON() while holding neigh_tbl_lock. Instead we remember that
we found an existing tbl with the same family, and after dropping
the lock we'll give a diagnostic kernel log message and a stack dump.
-DaveM ]
Signed-off-by: Simon Kelley <simon@thekelleys.org.uk>
Signed-off-by: David S. Miller <davem@davemloft.net>
2006-05-12 14:56:08 -07:00
extern void neigh_table_init_no_netlink ( struct neigh_table * tbl ) ;
2005-04-16 15:20:36 -07:00
extern int neigh_table_clear ( struct neigh_table * tbl ) ;
extern struct neighbour * neigh_lookup ( struct neigh_table * tbl ,
const void * pkey ,
struct net_device * dev ) ;
extern struct neighbour * neigh_lookup_nodev ( struct neigh_table * tbl ,
2008-01-24 00:13:18 -08:00
struct net * net ,
2005-04-16 15:20:36 -07:00
const void * pkey ) ;
extern struct neighbour * neigh_create ( struct neigh_table * tbl ,
const void * pkey ,
struct net_device * dev ) ;
extern void neigh_destroy ( struct neighbour * neigh ) ;
extern int __neigh_event_send ( struct neighbour * neigh , struct sk_buff * skb ) ;
extern int neigh_update ( struct neighbour * neigh , const u8 * lladdr , u8 new ,
u32 flags ) ;
extern void neigh_changeaddr ( struct neigh_table * tbl , struct net_device * dev ) ;
extern int neigh_ifdown ( struct neigh_table * tbl , struct net_device * dev ) ;
extern int neigh_resolve_output ( struct sk_buff * skb ) ;
extern int neigh_connected_output ( struct sk_buff * skb ) ;
extern int neigh_compat_output ( struct sk_buff * skb ) ;
extern struct neighbour * neigh_event_ns ( struct neigh_table * tbl ,
u8 * lladdr , void * saddr ,
struct net_device * dev ) ;
extern struct neigh_parms * neigh_parms_alloc ( struct net_device * dev , struct neigh_table * tbl ) ;
extern void neigh_parms_release ( struct neigh_table * tbl , struct neigh_parms * parms ) ;
2008-03-26 03:49:59 +09:00
static inline
struct net * neigh_parms_net ( const struct neigh_parms * parms )
{
2008-11-12 00:54:54 -08:00
return read_pnet ( & parms - > net ) ;
2008-03-26 03:49:59 +09:00
}
2005-04-16 15:20:36 -07:00
extern unsigned long neigh_rand_reach_time ( unsigned long base ) ;
extern void pneigh_enqueue ( struct neigh_table * tbl , struct neigh_parms * p ,
struct sk_buff * skb ) ;
2008-01-24 00:13:18 -08:00
extern struct pneigh_entry * pneigh_lookup ( struct neigh_table * tbl , struct net * net , const void * key , struct net_device * dev , int creat ) ;
2008-03-24 14:48:59 -07:00
extern struct pneigh_entry * __pneigh_lookup ( struct neigh_table * tbl ,
struct net * net ,
const void * key ,
struct net_device * dev ) ;
2008-01-24 00:13:18 -08:00
extern int pneigh_delete ( struct neigh_table * tbl , struct net * net , const void * key , struct net_device * dev ) ;
2005-04-16 15:20:36 -07:00
2008-03-26 03:49:59 +09:00
static inline
struct net * pneigh_net ( const struct pneigh_entry * pneigh )
{
2008-11-12 00:54:54 -08:00
return read_pnet ( & pneigh - > net ) ;
2008-03-26 03:49:59 +09:00
}
2005-04-16 15:20:36 -07:00
extern void neigh_app_ns ( struct neighbour * n ) ;
extern void neigh_for_each ( struct neigh_table * tbl , void ( * cb ) ( struct neighbour * , void * ) , void * cookie ) ;
extern void __neigh_for_each_release ( struct neigh_table * tbl , int ( * cb ) ( struct neighbour * ) ) ;
extern void pneigh_for_each ( struct neigh_table * tbl , void ( * cb ) ( struct pneigh_entry * ) ) ;
struct neigh_seq_state {
2008-01-10 03:53:12 -08:00
struct seq_net_private p ;
2005-04-16 15:20:36 -07:00
struct neigh_table * tbl ;
2010-10-04 06:15:44 +00:00
struct neigh_hash_table * nht ;
2005-04-16 15:20:36 -07:00
void * ( * neigh_sub_iter ) ( struct neigh_seq_state * state ,
struct neighbour * n , loff_t * pos ) ;
unsigned int bucket ;
unsigned int flags ;
# define NEIGH_SEQ_NEIGH_ONLY 0x00000001
# define NEIGH_SEQ_IS_PNEIGH 0x00000002
# define NEIGH_SEQ_SKIP_NOARP 0x00000004
} ;
extern void * neigh_seq_start ( struct seq_file * , loff_t * , struct neigh_table * , unsigned int ) ;
extern void * neigh_seq_next ( struct seq_file * , void * , loff_t * ) ;
extern void neigh_seq_stop ( struct seq_file * , void * ) ;
extern int neigh_sysctl_register ( struct net_device * dev ,
struct neigh_parms * p ,
char * p_name ,
2009-11-05 13:32:03 -08:00
proc_handler * proc_handler ) ;
2005-04-16 15:20:36 -07:00
extern void neigh_sysctl_unregister ( struct neigh_parms * p ) ;
static inline void __neigh_parms_put ( struct neigh_parms * parms )
{
atomic_dec ( & parms - > refcnt ) ;
}
static inline struct neigh_parms * neigh_parms_clone ( struct neigh_parms * parms )
{
atomic_inc ( & parms - > refcnt ) ;
return parms ;
}
/*
* Neighbour references
*/
static inline void neigh_release ( struct neighbour * neigh )
{
if ( atomic_dec_and_test ( & neigh - > refcnt ) )
neigh_destroy ( neigh ) ;
}
static inline struct neighbour * neigh_clone ( struct neighbour * neigh )
{
if ( neigh )
atomic_inc ( & neigh - > refcnt ) ;
return neigh ;
}
# define neigh_hold(n) atomic_inc(&(n)->refcnt)
static inline void neigh_confirm ( struct neighbour * neigh )
{
if ( neigh )
neigh - > confirmed = jiffies ;
}
static inline int neigh_event_send ( struct neighbour * neigh , struct sk_buff * skb )
{
2010-11-18 09:40:04 -08:00
unsigned long now = jiffies ;
2010-10-07 10:44:07 +00:00
if ( neigh - > used ! = now )
neigh - > used = now ;
2005-04-16 15:20:36 -07:00
if ( ! ( neigh - > nud_state & ( NUD_CONNECTED | NUD_DELAY | NUD_PROBE ) ) )
return __neigh_event_send ( neigh , skb ) ;
return 0 ;
}
2010-04-15 12:26:39 +02:00
# ifdef CONFIG_BRIDGE_NETFILTER
static inline int neigh_hh_bridge ( struct hh_cache * hh , struct sk_buff * skb )
{
unsigned seq , hh_alen ;
do {
seq = read_seqbegin ( & hh - > hh_lock ) ;
hh_alen = HH_DATA_ALIGN ( ETH_HLEN ) ;
memcpy ( skb - > data - hh_alen , hh - > hh_data , ETH_ALEN + hh_alen - ETH_HLEN ) ;
} while ( read_seqretry ( & hh - > hh_lock , seq ) ) ;
return 0 ;
}
# endif
2006-12-07 15:08:17 -08:00
static inline int neigh_hh_output ( struct hh_cache * hh , struct sk_buff * skb )
{
unsigned seq ;
int hh_len ;
do {
int hh_alen ;
seq = read_seqbegin ( & hh - > hh_lock ) ;
hh_len = hh - > hh_len ;
hh_alen = HH_DATA_ALIGN ( hh_len ) ;
memcpy ( skb - > data - hh_alen , hh - > hh_data , hh_alen ) ;
} while ( read_seqretry ( & hh - > hh_lock , seq ) ) ;
skb_push ( skb , hh_len ) ;
return hh - > hh_output ( skb ) ;
}
2005-04-16 15:20:36 -07:00
static inline struct neighbour *
__neigh_lookup ( struct neigh_table * tbl , const void * pkey , struct net_device * dev , int creat )
{
struct neighbour * n = neigh_lookup ( tbl , pkey , dev ) ;
if ( n | | ! creat )
return n ;
n = neigh_create ( tbl , pkey , dev ) ;
return IS_ERR ( n ) ? NULL : n ;
}
static inline struct neighbour *
__neigh_lookup_errno ( struct neigh_table * tbl , const void * pkey ,
struct net_device * dev )
{
struct neighbour * n = neigh_lookup ( tbl , pkey , dev ) ;
if ( n )
return n ;
return neigh_create ( tbl , pkey , dev ) ;
}
2005-08-14 17:24:31 -07:00
struct neighbour_cb {
unsigned long sched_next ;
unsigned int flags ;
} ;
# define LOCALLY_ENQUEUED 0x1
# define NEIGH_CB(skb) ((struct neighbour_cb *)(skb)->cb)
2005-04-16 15:20:36 -07:00
2010-10-07 10:44:07 +00:00
static inline void neigh_ha_snapshot ( char * dst , const struct neighbour * n ,
const struct net_device * dev )
{
unsigned int seq ;
do {
seq = read_seqbegin ( & n - > ha_lock ) ;
memcpy ( dst , n - > ha , dev - > addr_len ) ;
} while ( read_seqretry ( & n - > ha_lock , seq ) ) ;
}
2005-04-16 15:20:36 -07:00
# endif