2005-04-17 02:20:36 +04:00
/*
* Linux INET6 implementation
* FIB front - end .
*
* Authors :
* Pedro Roque < roque @ di . fc . ul . pt >
*
* $ Id : route . c , v 1.56 2001 / 10 / 31 21 : 55 : 55 davem Exp $
*
* This program is free software ; you can redistribute it and / or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation ; either version
* 2 of the License , or ( at your option ) any later version .
*/
/* Changes:
*
* YOSHIFUJI Hideaki @ USAGI
* reworked default router selection .
* - respect outgoing interface
* - select from ( probably ) reachable routers ( i . e .
* routers in REACHABLE , STALE , DELAY or PROBE states ) .
* - always select the same router if it is ( probably )
* reachable . otherwise , round - robin the list .
2006-08-24 04:23:25 +04:00
* Ville Nuorvala
* Fixed routing subtrees .
2005-04-17 02:20:36 +04:00
*/
2006-01-11 23:17:47 +03:00
# include <linux/capability.h>
2005-04-17 02:20:36 +04:00
# include <linux/errno.h>
# include <linux/types.h>
# include <linux/times.h>
# include <linux/socket.h>
# include <linux/sockios.h>
# include <linux/net.h>
# include <linux/route.h>
# include <linux/netdevice.h>
# include <linux/in6.h>
# include <linux/init.h>
# include <linux/if_arp.h>
# ifdef CONFIG_PROC_FS
# include <linux/proc_fs.h>
# include <linux/seq_file.h>
# endif
# include <net/snmp.h>
# include <net/ipv6.h>
# include <net/ip6_fib.h>
# include <net/ip6_route.h>
# include <net/ndisc.h>
# include <net/addrconf.h>
# include <net/tcp.h>
# include <linux/rtnetlink.h>
# include <net/dst.h>
# include <net/xfrm.h>
2006-07-31 07:43:36 +04:00
# include <net/netevent.h>
2006-08-15 11:35:24 +04:00
# include <net/netlink.h>
2005-04-17 02:20:36 +04:00
# include <asm/uaccess.h>
# ifdef CONFIG_SYSCTL
# include <linux/sysctl.h>
# endif
/* Set to 3 to get tracing. */
# define RT6_DEBUG 2
# if RT6_DEBUG >= 3
# define RDBG(x) printk x
# define RT6_TRACE(x...) printk(KERN_DEBUG x)
# else
# define RDBG(x)
# define RT6_TRACE(x...) do { ; } while (0)
# endif
2006-03-21 04:00:05 +03:00
# define CLONE_OFFLINK_ROUTE 0
2005-04-17 02:20:36 +04:00
static int ip6_rt_max_size = 4096 ;
static int ip6_rt_gc_min_interval = HZ / 2 ;
static int ip6_rt_gc_timeout = 60 * HZ ;
int ip6_rt_gc_interval = 30 * HZ ;
static int ip6_rt_gc_elasticity = 9 ;
static int ip6_rt_mtu_expires = 10 * 60 * HZ ;
static int ip6_rt_min_advmss = IPV6_MIN_MTU - 20 - 40 ;
static struct rt6_info * ip6_rt_copy ( struct rt6_info * ort ) ;
static struct dst_entry * ip6_dst_check ( struct dst_entry * dst , u32 cookie ) ;
static struct dst_entry * ip6_negative_advice ( struct dst_entry * ) ;
static void ip6_dst_destroy ( struct dst_entry * ) ;
static void ip6_dst_ifdown ( struct dst_entry * ,
struct net_device * dev , int how ) ;
static int ip6_dst_gc ( void ) ;
static int ip6_pkt_discard ( struct sk_buff * skb ) ;
static int ip6_pkt_discard_out ( struct sk_buff * skb ) ;
static void ip6_link_failure ( struct sk_buff * skb ) ;
static void ip6_rt_update_pmtu ( struct dst_entry * dst , u32 mtu ) ;
2006-03-21 04:06:24 +03:00
# ifdef CONFIG_IPV6_ROUTE_INFO
static struct rt6_info * rt6_add_route_info ( struct in6_addr * prefix , int prefixlen ,
struct in6_addr * gwaddr , int ifindex ,
unsigned pref ) ;
static struct rt6_info * rt6_get_route_info ( struct in6_addr * prefix , int prefixlen ,
struct in6_addr * gwaddr , int ifindex ) ;
# endif
2005-04-17 02:20:36 +04:00
static struct dst_ops ip6_dst_ops = {
. family = AF_INET6 ,
. protocol = __constant_htons ( ETH_P_IPV6 ) ,
. gc = ip6_dst_gc ,
. gc_thresh = 1024 ,
. check = ip6_dst_check ,
. destroy = ip6_dst_destroy ,
. ifdown = ip6_dst_ifdown ,
. negative_advice = ip6_negative_advice ,
. link_failure = ip6_link_failure ,
. update_pmtu = ip6_rt_update_pmtu ,
. entry_size = sizeof ( struct rt6_info ) ,
} ;
struct rt6_info ip6_null_entry = {
. u = {
. dst = {
. __refcnt = ATOMIC_INIT ( 1 ) ,
. __use = 1 ,
. dev = & loopback_dev ,
. obsolete = - 1 ,
. error = - ENETUNREACH ,
. metrics = { [ RTAX_HOPLIMIT - 1 ] = 255 , } ,
. input = ip6_pkt_discard ,
. output = ip6_pkt_discard_out ,
. ops = & ip6_dst_ops ,
. path = ( struct dst_entry * ) & ip6_null_entry ,
}
} ,
. rt6i_flags = ( RTF_REJECT | RTF_NONEXTHOP ) ,
. rt6i_metric = ~ ( u32 ) 0 ,
. rt6i_ref = ATOMIC_INIT ( 1 ) ,
} ;
2006-08-04 14:39:02 +04:00
# ifdef CONFIG_IPV6_MULTIPLE_TABLES
2006-10-19 08:20:57 +04:00
static int ip6_pkt_prohibit ( struct sk_buff * skb ) ;
static int ip6_pkt_prohibit_out ( struct sk_buff * skb ) ;
static int ip6_pkt_blk_hole ( struct sk_buff * skb ) ;
2006-08-04 14:39:02 +04:00
struct rt6_info ip6_prohibit_entry = {
. u = {
. dst = {
. __refcnt = ATOMIC_INIT ( 1 ) ,
. __use = 1 ,
. dev = & loopback_dev ,
. obsolete = - 1 ,
. error = - EACCES ,
. metrics = { [ RTAX_HOPLIMIT - 1 ] = 255 , } ,
2006-10-19 07:46:54 +04:00
. input = ip6_pkt_prohibit ,
. output = ip6_pkt_prohibit_out ,
2006-08-04 14:39:02 +04:00
. ops = & ip6_dst_ops ,
. path = ( struct dst_entry * ) & ip6_prohibit_entry ,
}
} ,
. rt6i_flags = ( RTF_REJECT | RTF_NONEXTHOP ) ,
. rt6i_metric = ~ ( u32 ) 0 ,
. rt6i_ref = ATOMIC_INIT ( 1 ) ,
} ;
struct rt6_info ip6_blk_hole_entry = {
. u = {
. dst = {
. __refcnt = ATOMIC_INIT ( 1 ) ,
. __use = 1 ,
. dev = & loopback_dev ,
. obsolete = - 1 ,
. error = - EINVAL ,
. metrics = { [ RTAX_HOPLIMIT - 1 ] = 255 , } ,
2006-10-19 07:46:54 +04:00
. input = ip6_pkt_blk_hole ,
. output = ip6_pkt_blk_hole ,
2006-08-04 14:39:02 +04:00
. ops = & ip6_dst_ops ,
. path = ( struct dst_entry * ) & ip6_blk_hole_entry ,
}
} ,
. rt6i_flags = ( RTF_REJECT | RTF_NONEXTHOP ) ,
. rt6i_metric = ~ ( u32 ) 0 ,
. rt6i_ref = ATOMIC_INIT ( 1 ) ,
} ;
# endif
2005-04-17 02:20:36 +04:00
/* allocate dst with ip6_dst_ops */
static __inline__ struct rt6_info * ip6_dst_alloc ( void )
{
return ( struct rt6_info * ) dst_alloc ( & ip6_dst_ops ) ;
}
static void ip6_dst_destroy ( struct dst_entry * dst )
{
struct rt6_info * rt = ( struct rt6_info * ) dst ;
struct inet6_dev * idev = rt - > rt6i_idev ;
if ( idev ! = NULL ) {
rt - > rt6i_idev = NULL ;
in6_dev_put ( idev ) ;
}
}
static void ip6_dst_ifdown ( struct dst_entry * dst , struct net_device * dev ,
int how )
{
struct rt6_info * rt = ( struct rt6_info * ) dst ;
struct inet6_dev * idev = rt - > rt6i_idev ;
if ( dev ! = & loopback_dev & & idev ! = NULL & & idev - > dev = = dev ) {
struct inet6_dev * loopback_idev = in6_dev_get ( & loopback_dev ) ;
if ( loopback_idev ! = NULL ) {
rt - > rt6i_idev = loopback_idev ;
in6_dev_put ( idev ) ;
}
}
}
static __inline__ int rt6_check_expired ( const struct rt6_info * rt )
{
return ( rt - > rt6i_flags & RTF_EXPIRES & &
time_after ( jiffies , rt - > rt6i_expires ) ) ;
}
2006-08-05 10:20:06 +04:00
static inline int rt6_need_strict ( struct in6_addr * daddr )
{
return ( ipv6_addr_type ( daddr ) &
( IPV6_ADDR_MULTICAST | IPV6_ADDR_LINKLOCAL ) ) ;
}
2005-04-17 02:20:36 +04:00
/*
2006-08-05 10:20:06 +04:00
* Route lookup . Any table - > tb6_lock is implied .
2005-04-17 02:20:36 +04:00
*/
static __inline__ struct rt6_info * rt6_device_match ( struct rt6_info * rt ,
int oif ,
int strict )
{
struct rt6_info * local = NULL ;
struct rt6_info * sprt ;
if ( oif ) {
for ( sprt = rt ; sprt ; sprt = sprt - > u . next ) {
struct net_device * dev = sprt - > rt6i_dev ;
if ( dev - > ifindex = = oif )
return sprt ;
if ( dev - > flags & IFF_LOOPBACK ) {
if ( sprt - > rt6i_idev = = NULL | |
sprt - > rt6i_idev - > dev - > ifindex ! = oif ) {
if ( strict & & oif )
continue ;
if ( local & & ( ! oif | |
local - > rt6i_idev - > dev - > ifindex = = oif ) )
continue ;
}
local = sprt ;
}
}
if ( local )
return local ;
if ( strict )
return & ip6_null_entry ;
}
return rt ;
}
2006-03-21 04:05:13 +03:00
# ifdef CONFIG_IPV6_ROUTER_PREF
static void rt6_probe ( struct rt6_info * rt )
{
struct neighbour * neigh = rt ? rt - > rt6i_nexthop : NULL ;
/*
* Okay , this does not seem to be appropriate
* for now , however , we need to check if it
* is really so ; aka Router Reachability Probing .
*
* Router Reachability Probe MUST be rate - limited
* to no more than one per minute .
*/
if ( ! neigh | | ( neigh - > nud_state & NUD_VALID ) )
return ;
read_lock_bh ( & neigh - > lock ) ;
if ( ! ( neigh - > nud_state & NUD_VALID ) & &
2006-03-21 04:05:47 +03:00
time_after ( jiffies , neigh - > updated + rt - > rt6i_idev - > cnf . rtr_probe_interval ) ) {
2006-03-21 04:05:13 +03:00
struct in6_addr mcaddr ;
struct in6_addr * target ;
neigh - > updated = jiffies ;
read_unlock_bh ( & neigh - > lock ) ;
target = ( struct in6_addr * ) & neigh - > primary_key ;
addrconf_addr_solict_mult ( target , & mcaddr ) ;
ndisc_send_ns ( rt - > rt6i_dev , NULL , target , & mcaddr , NULL ) ;
} else
read_unlock_bh ( & neigh - > lock ) ;
}
# else
static inline void rt6_probe ( struct rt6_info * rt )
{
return ;
}
# endif
2005-04-17 02:20:36 +04:00
/*
2006-03-21 04:00:26 +03:00
* Default Router Selection ( RFC 2461 6.3 .6 )
2005-04-17 02:20:36 +04:00
*/
2006-03-21 04:00:26 +03:00
static int inline rt6_check_dev ( struct rt6_info * rt , int oif )
{
struct net_device * dev = rt - > rt6i_dev ;
if ( ! oif | | dev - > ifindex = = oif )
return 2 ;
if ( ( dev - > flags & IFF_LOOPBACK ) & &
rt - > rt6i_idev & & rt - > rt6i_idev - > dev - > ifindex = = oif )
return 1 ;
return 0 ;
}
2005-04-17 02:20:36 +04:00
2006-03-21 04:00:26 +03:00
static int inline rt6_check_neigh ( struct rt6_info * rt )
2005-04-17 02:20:36 +04:00
{
2006-03-21 04:00:26 +03:00
struct neighbour * neigh = rt - > rt6i_nexthop ;
int m = 0 ;
2006-05-27 00:23:41 +04:00
if ( rt - > rt6i_flags & RTF_NONEXTHOP | |
! ( rt - > rt6i_flags & RTF_GATEWAY ) )
m = 1 ;
else if ( neigh ) {
2006-03-21 04:00:26 +03:00
read_lock_bh ( & neigh - > lock ) ;
if ( neigh - > nud_state & NUD_VALID )
2006-05-27 00:23:41 +04:00
m = 2 ;
2006-11-06 20:45:44 +03:00
else if ( ! ( neigh - > nud_state & NUD_FAILED ) )
m = 1 ;
2006-03-21 04:00:26 +03:00
read_unlock_bh ( & neigh - > lock ) ;
2005-04-17 02:20:36 +04:00
}
2006-03-21 04:00:26 +03:00
return m ;
2005-04-17 02:20:36 +04:00
}
2006-03-21 04:00:26 +03:00
static int rt6_score_route ( struct rt6_info * rt , int oif ,
int strict )
2005-04-17 02:20:36 +04:00
{
2006-05-27 00:23:41 +04:00
int m , n ;
m = rt6_check_dev ( rt , oif ) ;
2006-08-24 04:25:05 +04:00
if ( ! m & & ( strict & RT6_LOOKUP_F_IFACE ) )
2006-03-21 04:00:26 +03:00
return - 1 ;
2006-03-21 04:04:53 +03:00
# ifdef CONFIG_IPV6_ROUTER_PREF
m | = IPV6_DECODE_PREF ( IPV6_EXTRACT_PREF ( rt - > rt6i_flags ) ) < < 2 ;
# endif
2006-05-27 00:23:41 +04:00
n = rt6_check_neigh ( rt ) ;
2006-11-06 20:45:45 +03:00
if ( ! n & & ( strict & RT6_LOOKUP_F_REACHABLE ) )
2006-03-21 04:00:26 +03:00
return - 1 ;
return m ;
}
static struct rt6_info * rt6_select ( struct rt6_info * * head , int oif ,
int strict )
{
struct rt6_info * match = NULL , * last = NULL ;
struct rt6_info * rt , * rt0 = * head ;
u32 metric ;
int mpri = - 1 ;
2005-04-17 02:20:36 +04:00
2006-03-21 04:00:26 +03:00
RT6_TRACE ( " %s(head=%p(*head=%p), oif=%d) \n " ,
__FUNCTION__ , head , head ? * head : NULL , oif ) ;
2005-04-17 02:20:36 +04:00
2006-03-21 04:00:26 +03:00
for ( rt = rt0 , metric = rt0 - > rt6i_metric ;
2006-04-29 02:59:15 +04:00
rt & & rt - > rt6i_metric = = metric & & ( ! last | | rt ! = rt0 ) ;
2006-03-21 04:00:26 +03:00
rt = rt - > u . next ) {
int m ;
2005-04-17 02:20:36 +04:00
2006-03-21 04:00:26 +03:00
if ( rt6_check_expired ( rt ) )
2005-04-17 02:20:36 +04:00
continue ;
2006-03-21 04:00:26 +03:00
last = rt ;
m = rt6_score_route ( rt , oif , strict ) ;
if ( m < 0 )
2005-04-17 02:20:36 +04:00
continue ;
2006-03-21 04:00:26 +03:00
if ( m > mpri ) {
2006-03-21 04:05:13 +03:00
rt6_probe ( match ) ;
2006-03-21 04:00:26 +03:00
match = rt ;
2005-04-17 02:20:36 +04:00
mpri = m ;
2006-03-21 04:05:13 +03:00
} else {
rt6_probe ( rt ) ;
2005-04-17 02:20:36 +04:00
}
}
2006-03-21 04:00:26 +03:00
if ( ! match & &
2006-08-24 04:25:05 +04:00
( strict & RT6_LOOKUP_F_REACHABLE ) & &
2006-03-21 04:00:26 +03:00
last & & last ! = rt0 ) {
/* no entries matched; do round-robin */
2006-06-27 13:53:55 +04:00
static DEFINE_SPINLOCK ( lock ) ;
2006-04-29 02:59:15 +04:00
spin_lock ( & lock ) ;
2006-03-21 04:00:26 +03:00
* head = rt0 - > u . next ;
rt0 - > u . next = last - > u . next ;
last - > u . next = rt0 ;
2006-04-29 02:59:15 +04:00
spin_unlock ( & lock ) ;
2005-04-17 02:20:36 +04:00
}
2006-03-21 04:00:26 +03:00
RT6_TRACE ( " %s() => %p, score=%d \n " ,
__FUNCTION__ , match , mpri ) ;
2005-04-17 02:20:36 +04:00
2006-03-21 04:00:26 +03:00
return ( match ? match : & ip6_null_entry ) ;
2005-04-17 02:20:36 +04:00
}
2006-03-21 04:06:24 +03:00
# ifdef CONFIG_IPV6_ROUTE_INFO
int rt6_route_rcv ( struct net_device * dev , u8 * opt , int len ,
struct in6_addr * gwaddr )
{
struct route_info * rinfo = ( struct route_info * ) opt ;
struct in6_addr prefix_buf , * prefix ;
unsigned int pref ;
u32 lifetime ;
struct rt6_info * rt ;
if ( len < sizeof ( struct route_info ) ) {
return - EINVAL ;
}
/* Sanity check for prefix_len and length */
if ( rinfo - > length > 3 ) {
return - EINVAL ;
} else if ( rinfo - > prefix_len > 128 ) {
return - EINVAL ;
} else if ( rinfo - > prefix_len > 64 ) {
if ( rinfo - > length < 2 ) {
return - EINVAL ;
}
} else if ( rinfo - > prefix_len > 0 ) {
if ( rinfo - > length < 1 ) {
return - EINVAL ;
}
}
pref = rinfo - > route_pref ;
if ( pref = = ICMPV6_ROUTER_PREF_INVALID )
pref = ICMPV6_ROUTER_PREF_MEDIUM ;
lifetime = htonl ( rinfo - > lifetime ) ;
if ( lifetime = = 0xffffffff ) {
/* infinity */
} else if ( lifetime > 0x7fffffff / HZ ) {
/* Avoid arithmetic overflow */
lifetime = 0x7fffffff / HZ - 1 ;
}
if ( rinfo - > length = = 3 )
prefix = ( struct in6_addr * ) rinfo - > prefix ;
else {
/* this function is safe */
ipv6_addr_prefix ( & prefix_buf ,
( struct in6_addr * ) rinfo - > prefix ,
rinfo - > prefix_len ) ;
prefix = & prefix_buf ;
}
rt = rt6_get_route_info ( prefix , rinfo - > prefix_len , gwaddr , dev - > ifindex ) ;
if ( rt & & ! lifetime ) {
2006-08-22 11:00:21 +04:00
ip6_del_rt ( rt ) ;
2006-03-21 04:06:24 +03:00
rt = NULL ;
}
if ( ! rt & & lifetime )
rt = rt6_add_route_info ( prefix , rinfo - > prefix_len , gwaddr , dev - > ifindex ,
pref ) ;
else if ( rt )
rt - > rt6i_flags = RTF_ROUTEINFO |
( rt - > rt6i_flags & ~ RTF_PREF_MASK ) | RTF_PREF ( pref ) ;
if ( rt ) {
if ( lifetime = = 0xffffffff ) {
rt - > rt6i_flags & = ~ RTF_EXPIRES ;
} else {
rt - > rt6i_expires = jiffies + HZ * lifetime ;
rt - > rt6i_flags | = RTF_EXPIRES ;
}
dst_release ( & rt - > u . dst ) ;
}
return 0 ;
}
# endif
2006-08-24 04:22:39 +04:00
# define BACKTRACK(saddr) \
do { \
if ( rt = = & ip6_null_entry ) { \
struct fib6_node * pn ; \
2006-10-17 09:11:11 +04:00
while ( 1 ) { \
2006-08-24 04:22:39 +04:00
if ( fn - > fn_flags & RTN_TL_ROOT ) \
goto out ; \
pn = fn - > parent ; \
if ( FIB6_SUBTREE ( pn ) & & FIB6_SUBTREE ( pn ) ! = fn ) \
fn = fib6_lookup ( pn - > subtree , NULL , saddr ) ; \
else \
fn = pn ; \
if ( fn - > fn_flags & RTN_RTINFO ) \
goto restart ; \
2006-08-05 10:20:06 +04:00
} \
} \
2006-08-24 04:22:39 +04:00
} while ( 0 )
2006-08-05 10:20:06 +04:00
static struct rt6_info * ip6_pol_route_lookup ( struct fib6_table * table ,
struct flowi * fl , int flags )
2005-04-17 02:20:36 +04:00
{
struct fib6_node * fn ;
struct rt6_info * rt ;
2006-08-05 10:20:06 +04:00
read_lock_bh ( & table - > tb6_lock ) ;
fn = fib6_lookup ( & table - > tb6_root , & fl - > fl6_dst , & fl - > fl6_src ) ;
restart :
rt = fn - > leaf ;
2006-08-24 04:25:05 +04:00
rt = rt6_device_match ( rt , fl - > oif , flags ) ;
2006-08-24 04:22:39 +04:00
BACKTRACK ( & fl - > fl6_src ) ;
2006-08-05 10:20:06 +04:00
out :
2006-08-29 00:19:30 +04:00
dst_hold ( & rt - > u . dst ) ;
2006-08-05 10:20:06 +04:00
read_unlock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
rt - > u . dst . lastuse = jiffies ;
2006-08-05 10:20:06 +04:00
rt - > u . dst . __use + + ;
return rt ;
}
struct rt6_info * rt6_lookup ( struct in6_addr * daddr , struct in6_addr * saddr ,
int oif , int strict )
{
struct flowi fl = {
. oif = oif ,
. nl_u = {
. ip6_u = {
. daddr = * daddr ,
} ,
} ,
} ;
struct dst_entry * dst ;
2006-08-24 04:25:05 +04:00
int flags = strict ? RT6_LOOKUP_F_IFACE : 0 ;
2006-08-05 10:20:06 +04:00
2006-10-14 02:01:03 +04:00
if ( saddr ) {
memcpy ( & fl . fl6_src , saddr , sizeof ( * saddr ) ) ;
flags | = RT6_LOOKUP_F_HAS_SADDR ;
}
2006-08-05 10:20:06 +04:00
dst = fib6_rule_lookup ( & fl , flags , ip6_pol_route_lookup ) ;
if ( dst - > error = = 0 )
return ( struct rt6_info * ) dst ;
dst_release ( dst ) ;
2005-04-17 02:20:36 +04:00
return NULL ;
}
2006-08-05 10:20:06 +04:00
/* ip6_ins_rt is called with FREE table->tb6_lock.
2005-04-17 02:20:36 +04:00
It takes new route entry , the addition fails by any reason the
route is freed . In any case , if caller does not hold it , it may
be destroyed .
*/
2006-08-22 11:01:08 +04:00
static int __ip6_ins_rt ( struct rt6_info * rt , struct nl_info * info )
2005-04-17 02:20:36 +04:00
{
int err ;
2006-08-05 10:20:06 +04:00
struct fib6_table * table ;
2005-04-17 02:20:36 +04:00
2006-08-05 10:20:06 +04:00
table = rt - > rt6i_table ;
write_lock_bh ( & table - > tb6_lock ) ;
2006-08-22 11:01:08 +04:00
err = fib6_add ( & table - > tb6_root , rt , info ) ;
2006-08-05 10:20:06 +04:00
write_unlock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
return err ;
}
2006-08-22 11:00:45 +04:00
int ip6_ins_rt ( struct rt6_info * rt )
{
2006-08-22 11:01:08 +04:00
return __ip6_ins_rt ( rt , NULL ) ;
2006-08-22 11:00:45 +04:00
}
2006-03-21 03:55:51 +03:00
static struct rt6_info * rt6_alloc_cow ( struct rt6_info * ort , struct in6_addr * daddr ,
struct in6_addr * saddr )
2005-04-17 02:20:36 +04:00
{
struct rt6_info * rt ;
/*
* Clone the route .
*/
rt = ip6_rt_copy ( ort ) ;
if ( rt ) {
2005-12-21 16:56:42 +03:00
if ( ! ( rt - > rt6i_flags & RTF_GATEWAY ) ) {
if ( rt - > rt6i_dst . plen ! = 128 & &
ipv6_addr_equal ( & rt - > rt6i_dst . addr , daddr ) )
rt - > rt6i_flags | = RTF_ANYCAST ;
2005-04-17 02:20:36 +04:00
ipv6_addr_copy ( & rt - > rt6i_gateway , daddr ) ;
2005-12-21 16:56:42 +03:00
}
2005-04-17 02:20:36 +04:00
2005-12-21 16:56:42 +03:00
ipv6_addr_copy ( & rt - > rt6i_dst . addr , daddr ) ;
2005-04-17 02:20:36 +04:00
rt - > rt6i_dst . plen = 128 ;
rt - > rt6i_flags | = RTF_CACHE ;
rt - > u . dst . flags | = DST_HOST ;
# ifdef CONFIG_IPV6_SUBTREES
if ( rt - > rt6i_src . plen & & saddr ) {
ipv6_addr_copy ( & rt - > rt6i_src . addr , saddr ) ;
rt - > rt6i_src . plen = 128 ;
}
# endif
rt - > rt6i_nexthop = ndisc_get_neigh ( rt - > rt6i_dev , & rt - > rt6i_gateway ) ;
2006-03-21 03:55:51 +03:00
}
2005-04-17 02:20:36 +04:00
2006-03-21 03:55:51 +03:00
return rt ;
}
2005-04-17 02:20:36 +04:00
2006-03-21 03:58:32 +03:00
static struct rt6_info * rt6_alloc_clone ( struct rt6_info * ort , struct in6_addr * daddr )
{
struct rt6_info * rt = ip6_rt_copy ( ort ) ;
if ( rt ) {
ipv6_addr_copy ( & rt - > rt6i_dst . addr , daddr ) ;
rt - > rt6i_dst . plen = 128 ;
rt - > rt6i_flags | = RTF_CACHE ;
rt - > u . dst . flags | = DST_HOST ;
rt - > rt6i_nexthop = neigh_clone ( ort - > rt6i_nexthop ) ;
}
return rt ;
}
2006-08-08 08:50:48 +04:00
static struct rt6_info * ip6_pol_route_input ( struct fib6_table * table ,
struct flowi * fl , int flags )
2005-04-17 02:20:36 +04:00
{
struct fib6_node * fn ;
2006-03-21 04:00:05 +03:00
struct rt6_info * rt , * nrt ;
2006-08-05 10:20:06 +04:00
int strict = 0 ;
2005-04-17 02:20:36 +04:00
int attempts = 3 ;
2006-03-21 04:00:05 +03:00
int err ;
2006-08-24 04:25:05 +04:00
int reachable = RT6_LOOKUP_F_REACHABLE ;
2005-04-17 02:20:36 +04:00
2006-08-24 04:25:05 +04:00
strict | = flags & RT6_LOOKUP_F_IFACE ;
2005-04-17 02:20:36 +04:00
relookup :
2006-08-05 10:20:06 +04:00
read_lock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
2006-03-21 04:04:35 +03:00
restart_2 :
2006-08-05 10:20:06 +04:00
fn = fib6_lookup ( & table - > tb6_root , & fl - > fl6_dst , & fl - > fl6_src ) ;
2005-04-17 02:20:36 +04:00
restart :
2006-08-05 10:20:06 +04:00
rt = rt6_select ( & fn - > leaf , fl - > iif , strict | reachable ) ;
2006-08-24 04:22:39 +04:00
BACKTRACK ( & fl - > fl6_src ) ;
2006-03-21 04:04:35 +03:00
if ( rt = = & ip6_null_entry | |
rt - > rt6i_flags & RTF_CACHE )
2006-03-21 04:01:24 +03:00
goto out ;
2005-04-17 02:20:36 +04:00
2006-03-21 03:59:08 +03:00
dst_hold ( & rt - > u . dst ) ;
2006-08-05 10:20:06 +04:00
read_unlock_bh ( & table - > tb6_lock ) ;
2006-03-21 03:59:08 +03:00
2006-03-21 04:00:05 +03:00
if ( ! rt - > rt6i_nexthop & & ! ( rt - > rt6i_flags & RTF_NONEXTHOP ) )
2006-08-05 10:20:06 +04:00
nrt = rt6_alloc_cow ( rt , & fl - > fl6_dst , & fl - > fl6_src ) ;
2006-03-21 04:00:05 +03:00
else {
# if CLONE_OFFLINK_ROUTE
2006-08-05 10:20:06 +04:00
nrt = rt6_alloc_clone ( rt , & fl - > fl6_dst ) ;
2006-03-21 04:00:05 +03:00
# else
goto out2 ;
# endif
}
2006-03-21 03:59:27 +03:00
2006-03-21 04:00:05 +03:00
dst_release ( & rt - > u . dst ) ;
rt = nrt ? : & ip6_null_entry ;
2005-04-17 02:20:36 +04:00
2006-03-21 04:00:05 +03:00
dst_hold ( & rt - > u . dst ) ;
if ( nrt ) {
2006-08-22 11:00:45 +04:00
err = ip6_ins_rt ( nrt ) ;
2006-03-21 04:00:05 +03:00
if ( ! err )
2005-04-17 02:20:36 +04:00
goto out2 ;
}
2006-03-21 04:00:05 +03:00
if ( - - attempts < = 0 )
goto out2 ;
/*
2006-08-05 10:20:06 +04:00
* Race condition ! In the gap , when table - > tb6_lock was
2006-03-21 04:00:05 +03:00
* released someone could insert this route . Relookup .
*/
dst_release ( & rt - > u . dst ) ;
goto relookup ;
out :
2006-03-21 04:04:35 +03:00
if ( reachable ) {
reachable = 0 ;
goto restart_2 ;
}
2006-03-21 04:00:05 +03:00
dst_hold ( & rt - > u . dst ) ;
2006-08-05 10:20:06 +04:00
read_unlock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
out2 :
rt - > u . dst . lastuse = jiffies ;
rt - > u . dst . __use + + ;
2006-08-05 10:20:06 +04:00
return rt ;
2005-04-17 02:20:36 +04:00
}
2006-08-05 10:20:06 +04:00
void ip6_route_input ( struct sk_buff * skb )
{
struct ipv6hdr * iph = skb - > nh . ipv6h ;
2006-10-14 02:01:03 +04:00
int flags = RT6_LOOKUP_F_HAS_SADDR ;
2006-08-05 10:20:06 +04:00
struct flowi fl = {
. iif = skb - > dev - > ifindex ,
. nl_u = {
. ip6_u = {
. daddr = iph - > daddr ,
. saddr = iph - > saddr ,
2006-08-26 03:07:48 +04:00
# ifdef CONFIG_IPV6_ROUTE_FWMARK
2006-08-21 14:22:01 +04:00
. fwmark = skb - > nfmark ,
2006-08-26 03:07:48 +04:00
# endif
2006-08-05 10:20:06 +04:00
. flowlabel = ( * ( u32 * ) iph ) & IPV6_FLOWINFO_MASK ,
} ,
} ,
. proto = iph - > nexthdr ,
} ;
2006-10-14 02:01:03 +04:00
if ( rt6_need_strict ( & iph - > daddr ) )
flags | = RT6_LOOKUP_F_IFACE ;
2006-08-05 10:20:06 +04:00
skb - > dst = fib6_rule_lookup ( & fl , flags , ip6_pol_route_input ) ;
}
static struct rt6_info * ip6_pol_route_output ( struct fib6_table * table ,
struct flowi * fl , int flags )
2005-04-17 02:20:36 +04:00
{
struct fib6_node * fn ;
2006-03-21 04:00:05 +03:00
struct rt6_info * rt , * nrt ;
2006-08-05 10:20:06 +04:00
int strict = 0 ;
2005-04-17 02:20:36 +04:00
int attempts = 3 ;
2006-03-21 04:00:05 +03:00
int err ;
2006-08-24 04:25:05 +04:00
int reachable = RT6_LOOKUP_F_REACHABLE ;
2005-04-17 02:20:36 +04:00
2006-08-24 04:25:05 +04:00
strict | = flags & RT6_LOOKUP_F_IFACE ;
2005-04-17 02:20:36 +04:00
relookup :
2006-08-05 10:20:06 +04:00
read_lock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
2006-03-21 04:04:35 +03:00
restart_2 :
2006-08-05 10:20:06 +04:00
fn = fib6_lookup ( & table - > tb6_root , & fl - > fl6_dst , & fl - > fl6_src ) ;
2005-04-17 02:20:36 +04:00
restart :
2006-03-21 04:04:35 +03:00
rt = rt6_select ( & fn - > leaf , fl - > oif , strict | reachable ) ;
2006-08-24 04:22:39 +04:00
BACKTRACK ( & fl - > fl6_src ) ;
2006-03-21 04:04:35 +03:00
if ( rt = = & ip6_null_entry | |
rt - > rt6i_flags & RTF_CACHE )
2005-04-17 02:20:36 +04:00
goto out ;
2006-03-21 03:59:08 +03:00
dst_hold ( & rt - > u . dst ) ;
2006-08-05 10:20:06 +04:00
read_unlock_bh ( & table - > tb6_lock ) ;
2006-03-21 03:59:08 +03:00
2006-03-21 04:00:05 +03:00
if ( ! rt - > rt6i_nexthop & & ! ( rt - > rt6i_flags & RTF_NONEXTHOP ) )
2006-03-21 03:59:27 +03:00
nrt = rt6_alloc_cow ( rt , & fl - > fl6_dst , & fl - > fl6_src ) ;
2006-03-21 04:00:05 +03:00
else {
# if CLONE_OFFLINK_ROUTE
nrt = rt6_alloc_clone ( rt , & fl - > fl6_dst ) ;
# else
goto out2 ;
# endif
}
2005-04-17 02:20:36 +04:00
2006-03-21 04:00:05 +03:00
dst_release ( & rt - > u . dst ) ;
rt = nrt ? : & ip6_null_entry ;
2005-04-17 02:20:36 +04:00
2006-03-21 04:00:05 +03:00
dst_hold ( & rt - > u . dst ) ;
if ( nrt ) {
2006-08-22 11:00:45 +04:00
err = ip6_ins_rt ( nrt ) ;
2006-03-21 04:00:05 +03:00
if ( ! err )
2005-04-17 02:20:36 +04:00
goto out2 ;
}
2006-03-21 03:59:27 +03:00
2006-03-21 04:00:05 +03:00
if ( - - attempts < = 0 )
goto out2 ;
/*
2006-08-05 10:20:06 +04:00
* Race condition ! In the gap , when table - > tb6_lock was
2006-03-21 04:00:05 +03:00
* released someone could insert this route . Relookup .
*/
dst_release ( & rt - > u . dst ) ;
goto relookup ;
out :
2006-03-21 04:04:35 +03:00
if ( reachable ) {
reachable = 0 ;
goto restart_2 ;
}
2006-03-21 04:00:05 +03:00
dst_hold ( & rt - > u . dst ) ;
2006-08-05 10:20:06 +04:00
read_unlock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
out2 :
rt - > u . dst . lastuse = jiffies ;
rt - > u . dst . __use + + ;
2006-08-05 10:20:06 +04:00
return rt ;
}
struct dst_entry * ip6_route_output ( struct sock * sk , struct flowi * fl )
{
int flags = 0 ;
if ( rt6_need_strict ( & fl - > fl6_dst ) )
2006-08-24 04:25:05 +04:00
flags | = RT6_LOOKUP_F_IFACE ;
2006-08-05 10:20:06 +04:00
2006-10-14 02:01:03 +04:00
if ( ! ipv6_addr_any ( & fl - > fl6_src ) )
flags | = RT6_LOOKUP_F_HAS_SADDR ;
2006-08-05 10:20:06 +04:00
return fib6_rule_lookup ( fl , flags , ip6_pol_route_output ) ;
2005-04-17 02:20:36 +04:00
}
/*
* Destination cache support functions
*/
static struct dst_entry * ip6_dst_check ( struct dst_entry * dst , u32 cookie )
{
struct rt6_info * rt ;
rt = ( struct rt6_info * ) dst ;
if ( rt & & rt - > rt6i_node & & ( rt - > rt6i_node - > fn_sernum = = cookie ) )
return dst ;
return NULL ;
}
static struct dst_entry * ip6_negative_advice ( struct dst_entry * dst )
{
struct rt6_info * rt = ( struct rt6_info * ) dst ;
if ( rt ) {
if ( rt - > rt6i_flags & RTF_CACHE )
2006-08-22 11:00:21 +04:00
ip6_del_rt ( rt ) ;
2005-04-17 02:20:36 +04:00
else
dst_release ( dst ) ;
}
return NULL ;
}
static void ip6_link_failure ( struct sk_buff * skb )
{
struct rt6_info * rt ;
icmpv6_send ( skb , ICMPV6_DEST_UNREACH , ICMPV6_ADDR_UNREACH , 0 , skb - > dev ) ;
rt = ( struct rt6_info * ) skb - > dst ;
if ( rt ) {
if ( rt - > rt6i_flags & RTF_CACHE ) {
dst_set_expires ( & rt - > u . dst , 0 ) ;
rt - > rt6i_flags | = RTF_EXPIRES ;
} else if ( rt - > rt6i_node & & ( rt - > rt6i_flags & RTF_DEFAULT ) )
rt - > rt6i_node - > fn_sernum = - 1 ;
}
}
static void ip6_rt_update_pmtu ( struct dst_entry * dst , u32 mtu )
{
struct rt6_info * rt6 = ( struct rt6_info * ) dst ;
if ( mtu < dst_mtu ( dst ) & & rt6 - > rt6i_dst . plen = = 128 ) {
rt6 - > rt6i_flags | = RTF_MODIFIED ;
if ( mtu < IPV6_MIN_MTU ) {
mtu = IPV6_MIN_MTU ;
dst - > metrics [ RTAX_FEATURES - 1 ] | = RTAX_FEATURE_ALLFRAG ;
}
dst - > metrics [ RTAX_MTU - 1 ] = mtu ;
2006-07-31 07:43:36 +04:00
call_netevent_notifiers ( NETEVENT_PMTU_UPDATE , dst ) ;
2005-04-17 02:20:36 +04:00
}
}
static int ipv6_get_mtu ( struct net_device * dev ) ;
static inline unsigned int ipv6_advmss ( unsigned int mtu )
{
mtu - = sizeof ( struct ipv6hdr ) + sizeof ( struct tcphdr ) ;
if ( mtu < ip6_rt_min_advmss )
mtu = ip6_rt_min_advmss ;
/*
* Maximal non - jumbo IPv6 payload is IPV6_MAXPLEN and
* corresponding MSS is IPV6_MAXPLEN - tcp_header_size .
* IPV6_MAXPLEN is also valid and means : " any MSS,
* rely only on pmtu discovery "
*/
if ( mtu > IPV6_MAXPLEN - sizeof ( struct tcphdr ) )
mtu = IPV6_MAXPLEN ;
return mtu ;
}
2006-08-04 14:37:36 +04:00
static struct dst_entry * ndisc_dst_gc_list ;
2006-08-08 08:50:48 +04:00
static DEFINE_SPINLOCK ( ndisc_lock ) ;
2006-08-04 14:37:36 +04:00
2005-04-17 02:20:36 +04:00
struct dst_entry * ndisc_dst_alloc ( struct net_device * dev ,
struct neighbour * neigh ,
struct in6_addr * addr ,
int ( * output ) ( struct sk_buff * ) )
{
struct rt6_info * rt ;
struct inet6_dev * idev = in6_dev_get ( dev ) ;
if ( unlikely ( idev = = NULL ) )
return NULL ;
rt = ip6_dst_alloc ( ) ;
if ( unlikely ( rt = = NULL ) ) {
in6_dev_put ( idev ) ;
goto out ;
}
dev_hold ( dev ) ;
if ( neigh )
neigh_hold ( neigh ) ;
else
neigh = ndisc_get_neigh ( dev , addr ) ;
rt - > rt6i_dev = dev ;
rt - > rt6i_idev = idev ;
rt - > rt6i_nexthop = neigh ;
atomic_set ( & rt - > u . dst . __refcnt , 1 ) ;
rt - > u . dst . metrics [ RTAX_HOPLIMIT - 1 ] = 255 ;
rt - > u . dst . metrics [ RTAX_MTU - 1 ] = ipv6_get_mtu ( rt - > rt6i_dev ) ;
rt - > u . dst . metrics [ RTAX_ADVMSS - 1 ] = ipv6_advmss ( dst_mtu ( & rt - > u . dst ) ) ;
rt - > u . dst . output = output ;
#if 0 /* there's no chance to use these for ndisc */
rt - > u . dst . flags = ipv6_addr_type ( addr ) & IPV6_ADDR_UNICAST
? DST_HOST
: 0 ;
ipv6_addr_copy ( & rt - > rt6i_dst . addr , addr ) ;
rt - > rt6i_dst . plen = 128 ;
# endif
2006-08-04 14:37:36 +04:00
spin_lock_bh ( & ndisc_lock ) ;
2005-04-17 02:20:36 +04:00
rt - > u . dst . next = ndisc_dst_gc_list ;
ndisc_dst_gc_list = & rt - > u . dst ;
2006-08-04 14:37:36 +04:00
spin_unlock_bh ( & ndisc_lock ) ;
2005-04-17 02:20:36 +04:00
fib6_force_start_gc ( ) ;
out :
return ( struct dst_entry * ) rt ;
}
int ndisc_dst_gc ( int * more )
{
struct dst_entry * dst , * next , * * pprev ;
int freed ;
next = NULL ;
2006-08-04 14:37:36 +04:00
freed = 0 ;
spin_lock_bh ( & ndisc_lock ) ;
2005-04-17 02:20:36 +04:00
pprev = & ndisc_dst_gc_list ;
2006-08-04 14:37:36 +04:00
2005-04-17 02:20:36 +04:00
while ( ( dst = * pprev ) ! = NULL ) {
if ( ! atomic_read ( & dst - > __refcnt ) ) {
* pprev = dst - > next ;
dst_free ( dst ) ;
freed + + ;
} else {
pprev = & dst - > next ;
( * more ) + + ;
}
}
2006-08-04 14:37:36 +04:00
spin_unlock_bh ( & ndisc_lock ) ;
2005-04-17 02:20:36 +04:00
return freed ;
}
static int ip6_dst_gc ( void )
{
static unsigned expire = 30 * HZ ;
static unsigned long last_gc ;
unsigned long now = jiffies ;
if ( time_after ( last_gc + ip6_rt_gc_min_interval , now ) & &
atomic_read ( & ip6_dst_ops . entries ) < = ip6_rt_max_size )
goto out ;
expire + + ;
fib6_run_gc ( expire ) ;
last_gc = now ;
if ( atomic_read ( & ip6_dst_ops . entries ) < ip6_dst_ops . gc_thresh )
expire = ip6_rt_gc_timeout > > 1 ;
out :
expire - = expire > > ip6_rt_gc_elasticity ;
return ( atomic_read ( & ip6_dst_ops . entries ) > ip6_rt_max_size ) ;
}
/* Clean host part of a prefix. Not necessary in radix tree,
but results in cleaner routing tables .
Remove it only when all the things will work !
*/
static int ipv6_get_mtu ( struct net_device * dev )
{
int mtu = IPV6_MIN_MTU ;
struct inet6_dev * idev ;
idev = in6_dev_get ( dev ) ;
if ( idev ) {
mtu = idev - > cnf . mtu6 ;
in6_dev_put ( idev ) ;
}
return mtu ;
}
int ipv6_get_hoplimit ( struct net_device * dev )
{
int hoplimit = ipv6_devconf . hop_limit ;
struct inet6_dev * idev ;
idev = in6_dev_get ( dev ) ;
if ( idev ) {
hoplimit = idev - > cnf . hop_limit ;
in6_dev_put ( idev ) ;
}
return hoplimit ;
}
/*
*
*/
2006-08-22 11:01:08 +04:00
int ip6_route_add ( struct fib6_config * cfg )
2005-04-17 02:20:36 +04:00
{
int err ;
struct rt6_info * rt = NULL ;
struct net_device * dev = NULL ;
struct inet6_dev * idev = NULL ;
2006-08-05 10:20:06 +04:00
struct fib6_table * table ;
2005-04-17 02:20:36 +04:00
int addr_type ;
2006-08-22 11:01:08 +04:00
if ( cfg - > fc_dst_len > 128 | | cfg - > fc_src_len > 128 )
2005-04-17 02:20:36 +04:00
return - EINVAL ;
# ifndef CONFIG_IPV6_SUBTREES
2006-08-22 11:01:08 +04:00
if ( cfg - > fc_src_len )
2005-04-17 02:20:36 +04:00
return - EINVAL ;
# endif
2006-08-22 11:01:08 +04:00
if ( cfg - > fc_ifindex ) {
2005-04-17 02:20:36 +04:00
err = - ENODEV ;
2006-08-22 11:01:08 +04:00
dev = dev_get_by_index ( cfg - > fc_ifindex ) ;
2005-04-17 02:20:36 +04:00
if ( ! dev )
goto out ;
idev = in6_dev_get ( dev ) ;
if ( ! idev )
goto out ;
}
2006-08-22 11:01:08 +04:00
if ( cfg - > fc_metric = = 0 )
cfg - > fc_metric = IP6_RT_PRIO_USER ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:08 +04:00
table = fib6_new_table ( cfg - > fc_table ) ;
2006-08-05 10:20:06 +04:00
if ( table = = NULL ) {
err = - ENOBUFS ;
goto out ;
}
2005-04-17 02:20:36 +04:00
rt = ip6_dst_alloc ( ) ;
if ( rt = = NULL ) {
err = - ENOMEM ;
goto out ;
}
rt - > u . dst . obsolete = - 1 ;
2006-08-22 11:01:08 +04:00
rt - > rt6i_expires = jiffies + clock_t_to_jiffies ( cfg - > fc_expires ) ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:08 +04:00
if ( cfg - > fc_protocol = = RTPROT_UNSPEC )
cfg - > fc_protocol = RTPROT_BOOT ;
rt - > rt6i_protocol = cfg - > fc_protocol ;
addr_type = ipv6_addr_type ( & cfg - > fc_dst ) ;
2005-04-17 02:20:36 +04:00
if ( addr_type & IPV6_ADDR_MULTICAST )
rt - > u . dst . input = ip6_mc_input ;
else
rt - > u . dst . input = ip6_forward ;
rt - > u . dst . output = ip6_output ;
2006-08-22 11:01:08 +04:00
ipv6_addr_prefix ( & rt - > rt6i_dst . addr , & cfg - > fc_dst , cfg - > fc_dst_len ) ;
rt - > rt6i_dst . plen = cfg - > fc_dst_len ;
2005-04-17 02:20:36 +04:00
if ( rt - > rt6i_dst . plen = = 128 )
rt - > u . dst . flags = DST_HOST ;
# ifdef CONFIG_IPV6_SUBTREES
2006-08-22 11:01:08 +04:00
ipv6_addr_prefix ( & rt - > rt6i_src . addr , & cfg - > fc_src , cfg - > fc_src_len ) ;
rt - > rt6i_src . plen = cfg - > fc_src_len ;
2005-04-17 02:20:36 +04:00
# endif
2006-08-22 11:01:08 +04:00
rt - > rt6i_metric = cfg - > fc_metric ;
2005-04-17 02:20:36 +04:00
/* We cannot add true routes via loopback here,
they would result in kernel looping ; promote them to reject routes
*/
2006-08-22 11:01:08 +04:00
if ( ( cfg - > fc_flags & RTF_REJECT ) | |
2005-04-17 02:20:36 +04:00
( dev & & ( dev - > flags & IFF_LOOPBACK ) & & ! ( addr_type & IPV6_ADDR_LOOPBACK ) ) ) {
/* hold loopback dev/idev if we haven't done so. */
if ( dev ! = & loopback_dev ) {
if ( dev ) {
dev_put ( dev ) ;
in6_dev_put ( idev ) ;
}
dev = & loopback_dev ;
dev_hold ( dev ) ;
idev = in6_dev_get ( dev ) ;
if ( ! idev ) {
err = - ENODEV ;
goto out ;
}
}
rt - > u . dst . output = ip6_pkt_discard_out ;
rt - > u . dst . input = ip6_pkt_discard ;
rt - > u . dst . error = - ENETUNREACH ;
rt - > rt6i_flags = RTF_REJECT | RTF_NONEXTHOP ;
goto install_route ;
}
2006-08-22 11:01:08 +04:00
if ( cfg - > fc_flags & RTF_GATEWAY ) {
2005-04-17 02:20:36 +04:00
struct in6_addr * gw_addr ;
int gwa_type ;
2006-08-22 11:01:08 +04:00
gw_addr = & cfg - > fc_gateway ;
ipv6_addr_copy ( & rt - > rt6i_gateway , gw_addr ) ;
2005-04-17 02:20:36 +04:00
gwa_type = ipv6_addr_type ( gw_addr ) ;
if ( gwa_type ! = ( IPV6_ADDR_LINKLOCAL | IPV6_ADDR_UNICAST ) ) {
struct rt6_info * grt ;
/* IPv6 strictly inhibits using not link-local
addresses as nexthop address .
Otherwise , router will not able to send redirects .
It is very good , but in some ( rare ! ) circumstances
( SIT , PtP , NBMA NOARP links ) it is handy to allow
some exceptions . - - ANK
*/
err = - EINVAL ;
if ( ! ( gwa_type & IPV6_ADDR_UNICAST ) )
goto out ;
2006-08-22 11:01:08 +04:00
grt = rt6_lookup ( gw_addr , NULL , cfg - > fc_ifindex , 1 ) ;
2005-04-17 02:20:36 +04:00
err = - EHOSTUNREACH ;
if ( grt = = NULL )
goto out ;
if ( dev ) {
if ( dev ! = grt - > rt6i_dev ) {
dst_release ( & grt - > u . dst ) ;
goto out ;
}
} else {
dev = grt - > rt6i_dev ;
idev = grt - > rt6i_idev ;
dev_hold ( dev ) ;
in6_dev_hold ( grt - > rt6i_idev ) ;
}
if ( ! ( grt - > rt6i_flags & RTF_GATEWAY ) )
err = 0 ;
dst_release ( & grt - > u . dst ) ;
if ( err )
goto out ;
}
err = - EINVAL ;
if ( dev = = NULL | | ( dev - > flags & IFF_LOOPBACK ) )
goto out ;
}
err = - ENODEV ;
if ( dev = = NULL )
goto out ;
2006-08-22 11:01:08 +04:00
if ( cfg - > fc_flags & ( RTF_GATEWAY | RTF_NONEXTHOP ) ) {
2005-04-17 02:20:36 +04:00
rt - > rt6i_nexthop = __neigh_lookup_errno ( & nd_tbl , & rt - > rt6i_gateway , dev ) ;
if ( IS_ERR ( rt - > rt6i_nexthop ) ) {
err = PTR_ERR ( rt - > rt6i_nexthop ) ;
rt - > rt6i_nexthop = NULL ;
goto out ;
}
}
2006-08-22 11:01:08 +04:00
rt - > rt6i_flags = cfg - > fc_flags ;
2005-04-17 02:20:36 +04:00
install_route :
2006-08-22 11:01:08 +04:00
if ( cfg - > fc_mx ) {
struct nlattr * nla ;
int remaining ;
nla_for_each_attr ( nla , cfg - > fc_mx , cfg - > fc_mx_len , remaining ) {
int type = nla - > nla_type ;
if ( type ) {
if ( type > RTAX_MAX ) {
2005-04-17 02:20:36 +04:00
err = - EINVAL ;
goto out ;
}
2006-08-22 11:01:08 +04:00
rt - > u . dst . metrics [ type - 1 ] = nla_get_u32 ( nla ) ;
2005-04-17 02:20:36 +04:00
}
}
}
if ( rt - > u . dst . metrics [ RTAX_HOPLIMIT - 1 ] = = 0 )
rt - > u . dst . metrics [ RTAX_HOPLIMIT - 1 ] = - 1 ;
if ( ! rt - > u . dst . metrics [ RTAX_MTU - 1 ] )
rt - > u . dst . metrics [ RTAX_MTU - 1 ] = ipv6_get_mtu ( dev ) ;
if ( ! rt - > u . dst . metrics [ RTAX_ADVMSS - 1 ] )
rt - > u . dst . metrics [ RTAX_ADVMSS - 1 ] = ipv6_advmss ( dst_mtu ( & rt - > u . dst ) ) ;
rt - > u . dst . dev = dev ;
rt - > rt6i_idev = idev ;
2006-08-05 10:20:06 +04:00
rt - > rt6i_table = table ;
2006-08-22 11:01:08 +04:00
return __ip6_ins_rt ( rt , & cfg - > fc_nlinfo ) ;
2005-04-17 02:20:36 +04:00
out :
if ( dev )
dev_put ( dev ) ;
if ( idev )
in6_dev_put ( idev ) ;
if ( rt )
dst_free ( ( struct dst_entry * ) rt ) ;
return err ;
}
2006-08-22 11:01:08 +04:00
static int __ip6_del_rt ( struct rt6_info * rt , struct nl_info * info )
2005-04-17 02:20:36 +04:00
{
int err ;
2006-08-05 10:20:06 +04:00
struct fib6_table * table ;
2005-04-17 02:20:36 +04:00
2006-08-07 09:22:47 +04:00
if ( rt = = & ip6_null_entry )
return - ENOENT ;
2006-08-05 10:20:06 +04:00
table = rt - > rt6i_table ;
write_lock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:08 +04:00
err = fib6_del ( rt , info ) ;
2005-04-17 02:20:36 +04:00
dst_release ( & rt - > u . dst ) ;
2006-08-05 10:20:06 +04:00
write_unlock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
return err ;
}
2006-08-22 11:00:21 +04:00
int ip6_del_rt ( struct rt6_info * rt )
{
2006-08-22 11:01:08 +04:00
return __ip6_del_rt ( rt , NULL ) ;
2006-08-22 11:00:21 +04:00
}
2006-08-22 11:01:08 +04:00
static int ip6_route_del ( struct fib6_config * cfg )
2005-04-17 02:20:36 +04:00
{
2006-08-05 10:20:06 +04:00
struct fib6_table * table ;
2005-04-17 02:20:36 +04:00
struct fib6_node * fn ;
struct rt6_info * rt ;
int err = - ESRCH ;
2006-08-22 11:01:08 +04:00
table = fib6_get_table ( cfg - > fc_table ) ;
2006-08-05 10:20:06 +04:00
if ( table = = NULL )
return err ;
read_lock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
2006-08-05 10:20:06 +04:00
fn = fib6_locate ( & table - > tb6_root ,
2006-08-22 11:01:08 +04:00
& cfg - > fc_dst , cfg - > fc_dst_len ,
& cfg - > fc_src , cfg - > fc_src_len ) ;
2005-04-17 02:20:36 +04:00
if ( fn ) {
for ( rt = fn - > leaf ; rt ; rt = rt - > u . next ) {
2006-08-22 11:01:08 +04:00
if ( cfg - > fc_ifindex & &
2005-04-17 02:20:36 +04:00
( rt - > rt6i_dev = = NULL | |
2006-08-22 11:01:08 +04:00
rt - > rt6i_dev - > ifindex ! = cfg - > fc_ifindex ) )
2005-04-17 02:20:36 +04:00
continue ;
2006-08-22 11:01:08 +04:00
if ( cfg - > fc_flags & RTF_GATEWAY & &
! ipv6_addr_equal ( & cfg - > fc_gateway , & rt - > rt6i_gateway ) )
2005-04-17 02:20:36 +04:00
continue ;
2006-08-22 11:01:08 +04:00
if ( cfg - > fc_metric & & cfg - > fc_metric ! = rt - > rt6i_metric )
2005-04-17 02:20:36 +04:00
continue ;
dst_hold ( & rt - > u . dst ) ;
2006-08-05 10:20:06 +04:00
read_unlock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:08 +04:00
return __ip6_del_rt ( rt , & cfg - > fc_nlinfo ) ;
2005-04-17 02:20:36 +04:00
}
}
2006-08-05 10:20:06 +04:00
read_unlock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
return err ;
}
/*
* Handle redirects
*/
2006-08-24 04:18:26 +04:00
struct ip6rd_flowi {
struct flowi fl ;
struct in6_addr gateway ;
} ;
static struct rt6_info * __ip6_route_redirect ( struct fib6_table * table ,
struct flowi * fl ,
int flags )
2005-04-17 02:20:36 +04:00
{
2006-08-24 04:18:26 +04:00
struct ip6rd_flowi * rdfl = ( struct ip6rd_flowi * ) fl ;
struct rt6_info * rt ;
2006-03-21 04:07:49 +03:00
struct fib6_node * fn ;
2006-08-05 10:20:06 +04:00
2005-04-17 02:20:36 +04:00
/*
2006-03-21 04:07:49 +03:00
* Get the " current " route for this destination and
* check if the redirect has come from approriate router .
*
* RFC 2461 specifies that redirects should only be
* accepted if they come from the nexthop to the target .
* Due to the way the routes are chosen , this notion
* is a bit fuzzy and one might need to check all possible
* routes .
2005-04-17 02:20:36 +04:00
*/
2006-08-05 10:20:06 +04:00
read_lock_bh ( & table - > tb6_lock ) ;
2006-08-24 04:18:26 +04:00
fn = fib6_lookup ( & table - > tb6_root , & fl - > fl6_dst , & fl - > fl6_src ) ;
2006-03-21 04:07:49 +03:00
restart :
for ( rt = fn - > leaf ; rt ; rt = rt - > u . next ) {
/*
* Current route is on - link ; redirect is always invalid .
*
* Seems , previous statement is not true . It could
* be node , which looks for us as on - link ( f . e . proxy ndisc )
* But then router serving it might decide , that we should
* know truth 8 ) 8 ) - - ANK ( 980726 ) .
*/
if ( rt6_check_expired ( rt ) )
continue ;
if ( ! ( rt - > rt6i_flags & RTF_GATEWAY ) )
continue ;
2006-08-24 04:18:26 +04:00
if ( fl - > oif ! = rt - > rt6i_dev - > ifindex )
2006-03-21 04:07:49 +03:00
continue ;
2006-08-24 04:18:26 +04:00
if ( ! ipv6_addr_equal ( & rdfl - > gateway , & rt - > rt6i_gateway ) )
2006-03-21 04:07:49 +03:00
continue ;
break ;
}
2006-08-24 04:18:26 +04:00
2006-08-24 04:23:11 +04:00
if ( ! rt )
2006-08-24 04:18:26 +04:00
rt = & ip6_null_entry ;
2006-08-24 04:23:11 +04:00
BACKTRACK ( & fl - > fl6_src ) ;
out :
2006-08-24 04:18:26 +04:00
dst_hold ( & rt - > u . dst ) ;
2006-08-05 10:20:06 +04:00
read_unlock_bh ( & table - > tb6_lock ) ;
2006-03-21 04:07:49 +03:00
2006-08-24 04:18:26 +04:00
return rt ;
} ;
static struct rt6_info * ip6_route_redirect ( struct in6_addr * dest ,
struct in6_addr * src ,
struct in6_addr * gateway ,
struct net_device * dev )
{
2006-10-14 02:01:03 +04:00
int flags = RT6_LOOKUP_F_HAS_SADDR ;
2006-08-24 04:18:26 +04:00
struct ip6rd_flowi rdfl = {
. fl = {
. oif = dev - > ifindex ,
. nl_u = {
. ip6_u = {
. daddr = * dest ,
. saddr = * src ,
} ,
} ,
} ,
. gateway = * gateway ,
} ;
2006-10-14 02:01:03 +04:00
if ( rt6_need_strict ( dest ) )
flags | = RT6_LOOKUP_F_IFACE ;
2006-08-24 04:18:26 +04:00
return ( struct rt6_info * ) fib6_rule_lookup ( ( struct flowi * ) & rdfl , flags , __ip6_route_redirect ) ;
}
void rt6_redirect ( struct in6_addr * dest , struct in6_addr * src ,
struct in6_addr * saddr ,
struct neighbour * neigh , u8 * lladdr , int on_link )
{
struct rt6_info * rt , * nrt = NULL ;
struct netevent_redirect netevent ;
rt = ip6_route_redirect ( dest , src , saddr , neigh - > dev ) ;
if ( rt = = & ip6_null_entry ) {
2005-04-17 02:20:36 +04:00
if ( net_ratelimit ( ) )
printk ( KERN_DEBUG " rt6_redirect: source isn't a valid nexthop "
" for redirect target \n " ) ;
2006-08-24 04:18:26 +04:00
goto out ;
2005-04-17 02:20:36 +04:00
}
/*
* We have finally decided to accept it .
*/
neigh_update ( neigh , lladdr , NUD_STALE ,
NEIGH_UPDATE_F_WEAK_OVERRIDE |
NEIGH_UPDATE_F_OVERRIDE |
( on_link ? 0 : ( NEIGH_UPDATE_F_OVERRIDE_ISROUTER |
NEIGH_UPDATE_F_ISROUTER ) )
) ;
/*
* Redirect received - > path was valid .
* Look , redirects are sent only in response to data packets ,
* so that this nexthop apparently is reachable . - - ANK
*/
dst_confirm ( & rt - > u . dst ) ;
/* Duplicate redirect: silently ignore. */
if ( neigh = = rt - > u . dst . neighbour )
goto out ;
nrt = ip6_rt_copy ( rt ) ;
if ( nrt = = NULL )
goto out ;
nrt - > rt6i_flags = RTF_GATEWAY | RTF_UP | RTF_DYNAMIC | RTF_CACHE ;
if ( on_link )
nrt - > rt6i_flags & = ~ RTF_GATEWAY ;
ipv6_addr_copy ( & nrt - > rt6i_dst . addr , dest ) ;
nrt - > rt6i_dst . plen = 128 ;
nrt - > u . dst . flags | = DST_HOST ;
ipv6_addr_copy ( & nrt - > rt6i_gateway , ( struct in6_addr * ) neigh - > primary_key ) ;
nrt - > rt6i_nexthop = neigh_clone ( neigh ) ;
/* Reset pmtu, it may be better */
nrt - > u . dst . metrics [ RTAX_MTU - 1 ] = ipv6_get_mtu ( neigh - > dev ) ;
nrt - > u . dst . metrics [ RTAX_ADVMSS - 1 ] = ipv6_advmss ( dst_mtu ( & nrt - > u . dst ) ) ;
2006-08-22 11:00:45 +04:00
if ( ip6_ins_rt ( nrt ) )
2005-04-17 02:20:36 +04:00
goto out ;
2006-07-31 07:43:36 +04:00
netevent . old = & rt - > u . dst ;
netevent . new = & nrt - > u . dst ;
call_netevent_notifiers ( NETEVENT_REDIRECT , & netevent ) ;
2005-04-17 02:20:36 +04:00
if ( rt - > rt6i_flags & RTF_CACHE ) {
2006-08-22 11:00:21 +04:00
ip6_del_rt ( rt ) ;
2005-04-17 02:20:36 +04:00
return ;
}
out :
dst_release ( & rt - > u . dst ) ;
return ;
}
/*
* Handle ICMP " packet too big " messages
* i . e . Path MTU discovery
*/
void rt6_pmtu_discovery ( struct in6_addr * daddr , struct in6_addr * saddr ,
struct net_device * dev , u32 pmtu )
{
struct rt6_info * rt , * nrt ;
int allfrag = 0 ;
rt = rt6_lookup ( daddr , saddr , dev - > ifindex , 0 ) ;
if ( rt = = NULL )
return ;
if ( pmtu > = dst_mtu ( & rt - > u . dst ) )
goto out ;
if ( pmtu < IPV6_MIN_MTU ) {
/*
* According to RFC2460 , PMTU is set to the IPv6 Minimum Link
* MTU ( 1280 ) and a fragment header should always be included
* after a node receiving Too Big message reporting PMTU is
* less than the IPv6 Minimum Link MTU .
*/
pmtu = IPV6_MIN_MTU ;
allfrag = 1 ;
}
/* New mtu received -> path was valid.
They are sent only in response to data packets ,
so that this nexthop apparently is reachable . - - ANK
*/
dst_confirm ( & rt - > u . dst ) ;
/* Host route. If it is static, it would be better
not to override it , but add new one , so that
when cache entry will expire old pmtu
would return automatically .
*/
if ( rt - > rt6i_flags & RTF_CACHE ) {
rt - > u . dst . metrics [ RTAX_MTU - 1 ] = pmtu ;
if ( allfrag )
rt - > u . dst . metrics [ RTAX_FEATURES - 1 ] | = RTAX_FEATURE_ALLFRAG ;
dst_set_expires ( & rt - > u . dst , ip6_rt_mtu_expires ) ;
rt - > rt6i_flags | = RTF_MODIFIED | RTF_EXPIRES ;
goto out ;
}
/* Network route.
Two cases are possible :
1. It is connected route . Action : COW
2. It is gatewayed route or NONEXTHOP route . Action : clone it .
*/
2006-03-21 03:58:48 +03:00
if ( ! rt - > rt6i_nexthop & & ! ( rt - > rt6i_flags & RTF_NONEXTHOP ) )
2006-03-21 03:56:32 +03:00
nrt = rt6_alloc_cow ( rt , daddr , saddr ) ;
2006-03-21 03:58:48 +03:00
else
nrt = rt6_alloc_clone ( rt , daddr ) ;
2006-03-21 03:56:32 +03:00
2006-03-21 03:58:48 +03:00
if ( nrt ) {
2006-03-21 03:56:32 +03:00
nrt - > u . dst . metrics [ RTAX_MTU - 1 ] = pmtu ;
if ( allfrag )
nrt - > u . dst . metrics [ RTAX_FEATURES - 1 ] | = RTAX_FEATURE_ALLFRAG ;
/* According to RFC 1981, detecting PMTU increase shouldn't be
* happened within 5 mins , the recommended timer is 10 mins .
* Here this route expiration time is set to ip6_rt_mtu_expires
* which is 10 mins . After 10 mins the decreased pmtu is expired
* and detecting PMTU increase will be automatically happened .
*/
dst_set_expires ( & nrt - > u . dst , ip6_rt_mtu_expires ) ;
nrt - > rt6i_flags | = RTF_DYNAMIC | RTF_EXPIRES ;
2006-08-22 11:00:45 +04:00
ip6_ins_rt ( nrt ) ;
2005-04-17 02:20:36 +04:00
}
out :
dst_release ( & rt - > u . dst ) ;
}
/*
* Misc support functions
*/
static struct rt6_info * ip6_rt_copy ( struct rt6_info * ort )
{
struct rt6_info * rt = ip6_dst_alloc ( ) ;
if ( rt ) {
rt - > u . dst . input = ort - > u . dst . input ;
rt - > u . dst . output = ort - > u . dst . output ;
memcpy ( rt - > u . dst . metrics , ort - > u . dst . metrics , RTAX_MAX * sizeof ( u32 ) ) ;
2006-10-17 09:14:26 +04:00
rt - > u . dst . error = ort - > u . dst . error ;
2005-04-17 02:20:36 +04:00
rt - > u . dst . dev = ort - > u . dst . dev ;
if ( rt - > u . dst . dev )
dev_hold ( rt - > u . dst . dev ) ;
rt - > rt6i_idev = ort - > rt6i_idev ;
if ( rt - > rt6i_idev )
in6_dev_hold ( rt - > rt6i_idev ) ;
rt - > u . dst . lastuse = jiffies ;
rt - > rt6i_expires = 0 ;
ipv6_addr_copy ( & rt - > rt6i_gateway , & ort - > rt6i_gateway ) ;
rt - > rt6i_flags = ort - > rt6i_flags & ~ RTF_EXPIRES ;
rt - > rt6i_metric = 0 ;
memcpy ( & rt - > rt6i_dst , & ort - > rt6i_dst , sizeof ( struct rt6key ) ) ;
# ifdef CONFIG_IPV6_SUBTREES
memcpy ( & rt - > rt6i_src , & ort - > rt6i_src , sizeof ( struct rt6key ) ) ;
# endif
2006-08-05 10:20:06 +04:00
rt - > rt6i_table = ort - > rt6i_table ;
2005-04-17 02:20:36 +04:00
}
return rt ;
}
2006-03-21 04:06:24 +03:00
# ifdef CONFIG_IPV6_ROUTE_INFO
static struct rt6_info * rt6_get_route_info ( struct in6_addr * prefix , int prefixlen ,
struct in6_addr * gwaddr , int ifindex )
{
struct fib6_node * fn ;
struct rt6_info * rt = NULL ;
2006-08-05 10:20:06 +04:00
struct fib6_table * table ;
table = fib6_get_table ( RT6_TABLE_INFO ) ;
if ( table = = NULL )
return NULL ;
2006-03-21 04:06:24 +03:00
2006-08-05 10:20:06 +04:00
write_lock_bh ( & table - > tb6_lock ) ;
fn = fib6_locate ( & table - > tb6_root , prefix , prefixlen , NULL , 0 ) ;
2006-03-21 04:06:24 +03:00
if ( ! fn )
goto out ;
for ( rt = fn - > leaf ; rt ; rt = rt - > u . next ) {
if ( rt - > rt6i_dev - > ifindex ! = ifindex )
continue ;
if ( ( rt - > rt6i_flags & ( RTF_ROUTEINFO | RTF_GATEWAY ) ) ! = ( RTF_ROUTEINFO | RTF_GATEWAY ) )
continue ;
if ( ! ipv6_addr_equal ( & rt - > rt6i_gateway , gwaddr ) )
continue ;
dst_hold ( & rt - > u . dst ) ;
break ;
}
out :
2006-08-05 10:20:06 +04:00
write_unlock_bh ( & table - > tb6_lock ) ;
2006-03-21 04:06:24 +03:00
return rt ;
}
static struct rt6_info * rt6_add_route_info ( struct in6_addr * prefix , int prefixlen ,
struct in6_addr * gwaddr , int ifindex ,
unsigned pref )
{
2006-08-22 11:01:08 +04:00
struct fib6_config cfg = {
. fc_table = RT6_TABLE_INFO ,
. fc_metric = 1024 ,
. fc_ifindex = ifindex ,
. fc_dst_len = prefixlen ,
. fc_flags = RTF_GATEWAY | RTF_ADDRCONF | RTF_ROUTEINFO |
RTF_UP | RTF_PREF ( pref ) ,
} ;
ipv6_addr_copy ( & cfg . fc_dst , prefix ) ;
ipv6_addr_copy ( & cfg . fc_gateway , gwaddr ) ;
2006-03-21 04:06:24 +03:00
2006-03-21 04:06:42 +03:00
/* We should treat it as a default route if prefix length is 0. */
if ( ! prefixlen )
2006-08-22 11:01:08 +04:00
cfg . fc_flags | = RTF_DEFAULT ;
2006-03-21 04:06:24 +03:00
2006-08-22 11:01:08 +04:00
ip6_route_add ( & cfg ) ;
2006-03-21 04:06:24 +03:00
return rt6_get_route_info ( prefix , prefixlen , gwaddr , ifindex ) ;
}
# endif
2005-04-17 02:20:36 +04:00
struct rt6_info * rt6_get_dflt_router ( struct in6_addr * addr , struct net_device * dev )
{
struct rt6_info * rt ;
2006-08-05 10:20:06 +04:00
struct fib6_table * table ;
2005-04-17 02:20:36 +04:00
2006-08-05 10:20:06 +04:00
table = fib6_get_table ( RT6_TABLE_DFLT ) ;
if ( table = = NULL )
return NULL ;
2005-04-17 02:20:36 +04:00
2006-08-05 10:20:06 +04:00
write_lock_bh ( & table - > tb6_lock ) ;
for ( rt = table - > tb6_root . leaf ; rt ; rt = rt - > u . next ) {
2005-04-17 02:20:36 +04:00
if ( dev = = rt - > rt6i_dev & &
2006-03-21 04:00:48 +03:00
( ( rt - > rt6i_flags & ( RTF_ADDRCONF | RTF_DEFAULT ) ) = = ( RTF_ADDRCONF | RTF_DEFAULT ) ) & &
2005-04-17 02:20:36 +04:00
ipv6_addr_equal ( & rt - > rt6i_gateway , addr ) )
break ;
}
if ( rt )
dst_hold ( & rt - > u . dst ) ;
2006-08-05 10:20:06 +04:00
write_unlock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
return rt ;
}
struct rt6_info * rt6_add_dflt_router ( struct in6_addr * gwaddr ,
2006-03-21 04:04:53 +03:00
struct net_device * dev ,
unsigned int pref )
2005-04-17 02:20:36 +04:00
{
2006-08-22 11:01:08 +04:00
struct fib6_config cfg = {
. fc_table = RT6_TABLE_DFLT ,
. fc_metric = 1024 ,
. fc_ifindex = dev - > ifindex ,
. fc_flags = RTF_GATEWAY | RTF_ADDRCONF | RTF_DEFAULT |
RTF_UP | RTF_EXPIRES | RTF_PREF ( pref ) ,
} ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:08 +04:00
ipv6_addr_copy ( & cfg . fc_gateway , gwaddr ) ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:08 +04:00
ip6_route_add ( & cfg ) ;
2005-04-17 02:20:36 +04:00
return rt6_get_dflt_router ( gwaddr , dev ) ;
}
void rt6_purge_dflt_routers ( void )
{
struct rt6_info * rt ;
2006-08-05 10:20:06 +04:00
struct fib6_table * table ;
/* NOTE: Keep consistent with rt6_get_dflt_router */
table = fib6_get_table ( RT6_TABLE_DFLT ) ;
if ( table = = NULL )
return ;
2005-04-17 02:20:36 +04:00
restart :
2006-08-05 10:20:06 +04:00
read_lock_bh ( & table - > tb6_lock ) ;
for ( rt = table - > tb6_root . leaf ; rt ; rt = rt - > u . next ) {
2005-04-17 02:20:36 +04:00
if ( rt - > rt6i_flags & ( RTF_DEFAULT | RTF_ADDRCONF ) ) {
dst_hold ( & rt - > u . dst ) ;
2006-08-05 10:20:06 +04:00
read_unlock_bh ( & table - > tb6_lock ) ;
2006-08-22 11:00:21 +04:00
ip6_del_rt ( rt ) ;
2005-04-17 02:20:36 +04:00
goto restart ;
}
}
2006-08-05 10:20:06 +04:00
read_unlock_bh ( & table - > tb6_lock ) ;
2005-04-17 02:20:36 +04:00
}
2006-08-22 11:01:08 +04:00
static void rtmsg_to_fib6_config ( struct in6_rtmsg * rtmsg ,
struct fib6_config * cfg )
{
memset ( cfg , 0 , sizeof ( * cfg ) ) ;
cfg - > fc_table = RT6_TABLE_MAIN ;
cfg - > fc_ifindex = rtmsg - > rtmsg_ifindex ;
cfg - > fc_metric = rtmsg - > rtmsg_metric ;
cfg - > fc_expires = rtmsg - > rtmsg_info ;
cfg - > fc_dst_len = rtmsg - > rtmsg_dst_len ;
cfg - > fc_src_len = rtmsg - > rtmsg_src_len ;
cfg - > fc_flags = rtmsg - > rtmsg_flags ;
ipv6_addr_copy ( & cfg - > fc_dst , & rtmsg - > rtmsg_dst ) ;
ipv6_addr_copy ( & cfg - > fc_src , & rtmsg - > rtmsg_src ) ;
ipv6_addr_copy ( & cfg - > fc_gateway , & rtmsg - > rtmsg_gateway ) ;
}
2005-04-17 02:20:36 +04:00
int ipv6_route_ioctl ( unsigned int cmd , void __user * arg )
{
2006-08-22 11:01:08 +04:00
struct fib6_config cfg ;
2005-04-17 02:20:36 +04:00
struct in6_rtmsg rtmsg ;
int err ;
switch ( cmd ) {
case SIOCADDRT : /* Add a route */
case SIOCDELRT : /* Delete a route */
if ( ! capable ( CAP_NET_ADMIN ) )
return - EPERM ;
err = copy_from_user ( & rtmsg , arg ,
sizeof ( struct in6_rtmsg ) ) ;
if ( err )
return - EFAULT ;
2006-08-22 11:01:08 +04:00
rtmsg_to_fib6_config ( & rtmsg , & cfg ) ;
2005-04-17 02:20:36 +04:00
rtnl_lock ( ) ;
switch ( cmd ) {
case SIOCADDRT :
2006-08-22 11:01:08 +04:00
err = ip6_route_add ( & cfg ) ;
2005-04-17 02:20:36 +04:00
break ;
case SIOCDELRT :
2006-08-22 11:01:08 +04:00
err = ip6_route_del ( & cfg ) ;
2005-04-17 02:20:36 +04:00
break ;
default :
err = - EINVAL ;
}
rtnl_unlock ( ) ;
return err ;
} ;
return - EINVAL ;
}
/*
* Drop the packet on the floor
*/
2006-10-19 07:46:54 +04:00
static inline int ip6_pkt_drop ( struct sk_buff * skb , int code )
2005-04-17 02:20:36 +04:00
{
2006-08-29 11:00:47 +04:00
int type = ipv6_addr_type ( & skb - > nh . ipv6h - > daddr ) ;
if ( type = = IPV6_ADDR_ANY | | type = = IPV6_ADDR_RESERVED )
IP6_INC_STATS ( IPSTATS_MIB_INADDRERRORS ) ;
2005-04-17 02:20:36 +04:00
IP6_INC_STATS ( IPSTATS_MIB_OUTNOROUTES ) ;
2006-10-19 07:46:54 +04:00
icmpv6_send ( skb , ICMPV6_DEST_UNREACH , code , 0 , skb - > dev ) ;
2005-04-17 02:20:36 +04:00
kfree_skb ( skb ) ;
return 0 ;
}
2006-10-19 07:46:54 +04:00
static int ip6_pkt_discard ( struct sk_buff * skb )
{
return ip6_pkt_drop ( skb , ICMPV6_NOROUTE ) ;
}
2005-08-16 09:18:02 +04:00
static int ip6_pkt_discard_out ( struct sk_buff * skb )
2005-04-17 02:20:36 +04:00
{
skb - > dev = skb - > dst - > dev ;
return ip6_pkt_discard ( skb ) ;
}
2006-10-19 08:20:57 +04:00
# ifdef CONFIG_IPV6_MULTIPLE_TABLES
2006-10-19 07:46:54 +04:00
static int ip6_pkt_prohibit ( struct sk_buff * skb )
{
return ip6_pkt_drop ( skb , ICMPV6_ADM_PROHIBITED ) ;
}
static int ip6_pkt_prohibit_out ( struct sk_buff * skb )
{
skb - > dev = skb - > dst - > dev ;
return ip6_pkt_prohibit ( skb ) ;
}
static int ip6_pkt_blk_hole ( struct sk_buff * skb )
{
kfree_skb ( skb ) ;
return 0 ;
}
2006-10-19 08:20:57 +04:00
# endif
2005-04-17 02:20:36 +04:00
/*
* Allocate a dst for local ( unicast / anycast ) address .
*/
struct rt6_info * addrconf_dst_alloc ( struct inet6_dev * idev ,
const struct in6_addr * addr ,
int anycast )
{
struct rt6_info * rt = ip6_dst_alloc ( ) ;
if ( rt = = NULL )
return ERR_PTR ( - ENOMEM ) ;
dev_hold ( & loopback_dev ) ;
in6_dev_hold ( idev ) ;
rt - > u . dst . flags = DST_HOST ;
rt - > u . dst . input = ip6_input ;
rt - > u . dst . output = ip6_output ;
rt - > rt6i_dev = & loopback_dev ;
rt - > rt6i_idev = idev ;
rt - > u . dst . metrics [ RTAX_MTU - 1 ] = ipv6_get_mtu ( rt - > rt6i_dev ) ;
rt - > u . dst . metrics [ RTAX_ADVMSS - 1 ] = ipv6_advmss ( dst_mtu ( & rt - > u . dst ) ) ;
rt - > u . dst . metrics [ RTAX_HOPLIMIT - 1 ] = - 1 ;
rt - > u . dst . obsolete = - 1 ;
rt - > rt6i_flags = RTF_UP | RTF_NONEXTHOP ;
2005-12-21 16:56:42 +03:00
if ( anycast )
rt - > rt6i_flags | = RTF_ANYCAST ;
else
2005-04-17 02:20:36 +04:00
rt - > rt6i_flags | = RTF_LOCAL ;
rt - > rt6i_nexthop = ndisc_get_neigh ( rt - > rt6i_dev , & rt - > rt6i_gateway ) ;
if ( rt - > rt6i_nexthop = = NULL ) {
dst_free ( ( struct dst_entry * ) rt ) ;
return ERR_PTR ( - ENOMEM ) ;
}
ipv6_addr_copy ( & rt - > rt6i_dst . addr , addr ) ;
rt - > rt6i_dst . plen = 128 ;
2006-08-05 10:20:06 +04:00
rt - > rt6i_table = fib6_get_table ( RT6_TABLE_LOCAL ) ;
2005-04-17 02:20:36 +04:00
atomic_set ( & rt - > u . dst . __refcnt , 1 ) ;
return rt ;
}
static int fib6_ifdown ( struct rt6_info * rt , void * arg )
{
if ( ( ( void * ) rt - > rt6i_dev = = arg | | arg = = NULL ) & &
rt ! = & ip6_null_entry ) {
RT6_TRACE ( " deleted by ifdown %p \n " , rt ) ;
return - 1 ;
}
return 0 ;
}
void rt6_ifdown ( struct net_device * dev )
{
2006-08-05 10:20:06 +04:00
fib6_clean_all ( fib6_ifdown , 0 , dev ) ;
2005-04-17 02:20:36 +04:00
}
struct rt6_mtu_change_arg
{
struct net_device * dev ;
unsigned mtu ;
} ;
static int rt6_mtu_change_route ( struct rt6_info * rt , void * p_arg )
{
struct rt6_mtu_change_arg * arg = ( struct rt6_mtu_change_arg * ) p_arg ;
struct inet6_dev * idev ;
/* In IPv6 pmtu discovery is not optional,
so that RTAX_MTU lock cannot disable it .
We still use this lock to block changes
caused by addrconf / ndisc .
*/
idev = __in6_dev_get ( arg - > dev ) ;
if ( idev = = NULL )
return 0 ;
/* For administrative MTU increase, there is no way to discover
IPv6 PMTU increase , so PMTU increase should be updated here .
Since RFC 1981 doesn ' t include administrative MTU increase
update PMTU increase is a MUST . ( i . e . jumbo frame )
*/
/*
If new MTU is less than route PMTU , this new MTU will be the
lowest MTU in the path , update the route PMTU to reflect PMTU
decreases ; if new MTU is greater than route PMTU , and the
old MTU is the lowest MTU in the path , update the route PMTU
to reflect the increase . In this case if the other nodes ' MTU
also have the lowest MTU , TOO BIG MESSAGE will be lead to
PMTU discouvery .
*/
if ( rt - > rt6i_dev = = arg - > dev & &
! dst_metric_locked ( & rt - > u . dst , RTAX_MTU ) & &
( dst_mtu ( & rt - > u . dst ) > arg - > mtu | |
( dst_mtu ( & rt - > u . dst ) < arg - > mtu & &
dst_mtu ( & rt - > u . dst ) = = idev - > cnf . mtu6 ) ) )
rt - > u . dst . metrics [ RTAX_MTU - 1 ] = arg - > mtu ;
rt - > u . dst . metrics [ RTAX_ADVMSS - 1 ] = ipv6_advmss ( arg - > mtu ) ;
return 0 ;
}
void rt6_mtu_change ( struct net_device * dev , unsigned mtu )
{
2006-08-05 10:20:06 +04:00
struct rt6_mtu_change_arg arg = {
. dev = dev ,
. mtu = mtu ,
} ;
2005-04-17 02:20:36 +04:00
2006-08-05 10:20:06 +04:00
fib6_clean_all ( rt6_mtu_change_route , 0 , & arg ) ;
2005-04-17 02:20:36 +04:00
}
2006-08-22 11:01:08 +04:00
static struct nla_policy rtm_ipv6_policy [ RTA_MAX + 1 ] __read_mostly = {
2006-08-27 07:13:18 +04:00
[ RTA_GATEWAY ] = { . len = sizeof ( struct in6_addr ) } ,
2006-08-22 11:01:08 +04:00
[ RTA_OIF ] = { . type = NLA_U32 } ,
2006-08-22 11:01:47 +04:00
[ RTA_IIF ] = { . type = NLA_U32 } ,
2006-08-22 11:01:08 +04:00
[ RTA_PRIORITY ] = { . type = NLA_U32 } ,
[ RTA_METRICS ] = { . type = NLA_NESTED } ,
} ;
static int rtm_to_fib6_config ( struct sk_buff * skb , struct nlmsghdr * nlh ,
struct fib6_config * cfg )
2005-04-17 02:20:36 +04:00
{
2006-08-22 11:01:08 +04:00
struct rtmsg * rtm ;
struct nlattr * tb [ RTA_MAX + 1 ] ;
int err ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:08 +04:00
err = nlmsg_parse ( nlh , sizeof ( * rtm ) , tb , RTA_MAX , rtm_ipv6_policy ) ;
if ( err < 0 )
goto errout ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:08 +04:00
err = - EINVAL ;
rtm = nlmsg_data ( nlh ) ;
memset ( cfg , 0 , sizeof ( * cfg ) ) ;
cfg - > fc_table = rtm - > rtm_table ;
cfg - > fc_dst_len = rtm - > rtm_dst_len ;
cfg - > fc_src_len = rtm - > rtm_src_len ;
cfg - > fc_flags = RTF_UP ;
cfg - > fc_protocol = rtm - > rtm_protocol ;
if ( rtm - > rtm_type = = RTN_UNREACHABLE )
cfg - > fc_flags | = RTF_REJECT ;
cfg - > fc_nlinfo . pid = NETLINK_CB ( skb ) . pid ;
cfg - > fc_nlinfo . nlh = nlh ;
if ( tb [ RTA_GATEWAY ] ) {
nla_memcpy ( & cfg - > fc_gateway , tb [ RTA_GATEWAY ] , 16 ) ;
cfg - > fc_flags | = RTF_GATEWAY ;
2005-04-17 02:20:36 +04:00
}
2006-08-22 11:01:08 +04:00
if ( tb [ RTA_DST ] ) {
int plen = ( rtm - > rtm_dst_len + 7 ) > > 3 ;
if ( nla_len ( tb [ RTA_DST ] ) < plen )
goto errout ;
nla_memcpy ( & cfg - > fc_dst , tb [ RTA_DST ] , plen ) ;
2005-04-17 02:20:36 +04:00
}
2006-08-22 11:01:08 +04:00
if ( tb [ RTA_SRC ] ) {
int plen = ( rtm - > rtm_src_len + 7 ) > > 3 ;
if ( nla_len ( tb [ RTA_SRC ] ) < plen )
goto errout ;
nla_memcpy ( & cfg - > fc_src , tb [ RTA_SRC ] , plen ) ;
2005-04-17 02:20:36 +04:00
}
2006-08-22 11:01:08 +04:00
if ( tb [ RTA_OIF ] )
cfg - > fc_ifindex = nla_get_u32 ( tb [ RTA_OIF ] ) ;
if ( tb [ RTA_PRIORITY ] )
cfg - > fc_metric = nla_get_u32 ( tb [ RTA_PRIORITY ] ) ;
if ( tb [ RTA_METRICS ] ) {
cfg - > fc_mx = nla_data ( tb [ RTA_METRICS ] ) ;
cfg - > fc_mx_len = nla_len ( tb [ RTA_METRICS ] ) ;
2005-04-17 02:20:36 +04:00
}
2006-08-22 11:01:08 +04:00
if ( tb [ RTA_TABLE ] )
cfg - > fc_table = nla_get_u32 ( tb [ RTA_TABLE ] ) ;
err = 0 ;
errout :
return err ;
2005-04-17 02:20:36 +04:00
}
int inet6_rtm_delroute ( struct sk_buff * skb , struct nlmsghdr * nlh , void * arg )
{
2006-08-22 11:01:08 +04:00
struct fib6_config cfg ;
int err ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:08 +04:00
err = rtm_to_fib6_config ( skb , nlh , & cfg ) ;
if ( err < 0 )
return err ;
return ip6_route_del ( & cfg ) ;
2005-04-17 02:20:36 +04:00
}
int inet6_rtm_newroute ( struct sk_buff * skb , struct nlmsghdr * nlh , void * arg )
{
2006-08-22 11:01:08 +04:00
struct fib6_config cfg ;
int err ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:08 +04:00
err = rtm_to_fib6_config ( skb , nlh , & cfg ) ;
if ( err < 0 )
return err ;
return ip6_route_add ( & cfg ) ;
2005-04-17 02:20:36 +04:00
}
static int rt6_fill_node ( struct sk_buff * skb , struct rt6_info * rt ,
2005-06-22 00:51:04 +04:00
struct in6_addr * dst , struct in6_addr * src ,
int iif , int type , u32 pid , u32 seq ,
int prefix , unsigned int flags )
2005-04-17 02:20:36 +04:00
{
struct rtmsg * rtm ;
2006-08-22 11:01:27 +04:00
struct nlmsghdr * nlh ;
2005-04-17 02:20:36 +04:00
struct rta_cacheinfo ci ;
2006-08-11 10:09:48 +04:00
u32 table ;
2005-04-17 02:20:36 +04:00
if ( prefix ) { /* user wants prefix routes only */
if ( ! ( rt - > rt6i_flags & RTF_PREFIX_RT ) ) {
/* success since this is not a prefix route */
return 1 ;
}
}
2006-08-22 11:01:27 +04:00
nlh = nlmsg_put ( skb , pid , seq , type , sizeof ( * rtm ) , flags ) ;
if ( nlh = = NULL )
return - ENOBUFS ;
rtm = nlmsg_data ( nlh ) ;
2005-04-17 02:20:36 +04:00
rtm - > rtm_family = AF_INET6 ;
rtm - > rtm_dst_len = rt - > rt6i_dst . plen ;
rtm - > rtm_src_len = rt - > rt6i_src . plen ;
rtm - > rtm_tos = 0 ;
2006-08-05 10:20:06 +04:00
if ( rt - > rt6i_table )
2006-08-11 10:09:48 +04:00
table = rt - > rt6i_table - > tb6_id ;
2006-08-05 10:20:06 +04:00
else
2006-08-11 10:09:48 +04:00
table = RT6_TABLE_UNSPEC ;
rtm - > rtm_table = table ;
2006-08-22 11:01:27 +04:00
NLA_PUT_U32 ( skb , RTA_TABLE , table ) ;
2005-04-17 02:20:36 +04:00
if ( rt - > rt6i_flags & RTF_REJECT )
rtm - > rtm_type = RTN_UNREACHABLE ;
else if ( rt - > rt6i_dev & & ( rt - > rt6i_dev - > flags & IFF_LOOPBACK ) )
rtm - > rtm_type = RTN_LOCAL ;
else
rtm - > rtm_type = RTN_UNICAST ;
rtm - > rtm_flags = 0 ;
rtm - > rtm_scope = RT_SCOPE_UNIVERSE ;
rtm - > rtm_protocol = rt - > rt6i_protocol ;
if ( rt - > rt6i_flags & RTF_DYNAMIC )
rtm - > rtm_protocol = RTPROT_REDIRECT ;
else if ( rt - > rt6i_flags & RTF_ADDRCONF )
rtm - > rtm_protocol = RTPROT_KERNEL ;
else if ( rt - > rt6i_flags & RTF_DEFAULT )
rtm - > rtm_protocol = RTPROT_RA ;
if ( rt - > rt6i_flags & RTF_CACHE )
rtm - > rtm_flags | = RTM_F_CLONED ;
if ( dst ) {
2006-08-22 11:01:27 +04:00
NLA_PUT ( skb , RTA_DST , 16 , dst ) ;
2005-04-17 02:20:36 +04:00
rtm - > rtm_dst_len = 128 ;
} else if ( rtm - > rtm_dst_len )
2006-08-22 11:01:27 +04:00
NLA_PUT ( skb , RTA_DST , 16 , & rt - > rt6i_dst . addr ) ;
2005-04-17 02:20:36 +04:00
# ifdef CONFIG_IPV6_SUBTREES
if ( src ) {
2006-08-22 11:01:27 +04:00
NLA_PUT ( skb , RTA_SRC , 16 , src ) ;
2005-04-17 02:20:36 +04:00
rtm - > rtm_src_len = 128 ;
} else if ( rtm - > rtm_src_len )
2006-08-22 11:01:27 +04:00
NLA_PUT ( skb , RTA_SRC , 16 , & rt - > rt6i_src . addr ) ;
2005-04-17 02:20:36 +04:00
# endif
if ( iif )
2006-08-22 11:01:27 +04:00
NLA_PUT_U32 ( skb , RTA_IIF , iif ) ;
2005-04-17 02:20:36 +04:00
else if ( dst ) {
struct in6_addr saddr_buf ;
if ( ipv6_get_saddr ( & rt - > u . dst , dst , & saddr_buf ) = = 0 )
2006-08-22 11:01:27 +04:00
NLA_PUT ( skb , RTA_PREFSRC , 16 , & saddr_buf ) ;
2005-04-17 02:20:36 +04:00
}
2006-08-22 11:01:27 +04:00
2005-04-17 02:20:36 +04:00
if ( rtnetlink_put_metrics ( skb , rt - > u . dst . metrics ) < 0 )
2006-08-22 11:01:27 +04:00
goto nla_put_failure ;
2005-04-17 02:20:36 +04:00
if ( rt - > u . dst . neighbour )
2006-08-22 11:01:27 +04:00
NLA_PUT ( skb , RTA_GATEWAY , 16 , & rt - > u . dst . neighbour - > primary_key ) ;
2005-04-17 02:20:36 +04:00
if ( rt - > u . dst . dev )
2006-08-22 11:01:27 +04:00
NLA_PUT_U32 ( skb , RTA_OIF , rt - > rt6i_dev - > ifindex ) ;
NLA_PUT_U32 ( skb , RTA_PRIORITY , rt - > rt6i_metric ) ;
2005-04-17 02:20:36 +04:00
ci . rta_lastuse = jiffies_to_clock_t ( jiffies - rt - > u . dst . lastuse ) ;
if ( rt - > rt6i_expires )
ci . rta_expires = jiffies_to_clock_t ( rt - > rt6i_expires - jiffies ) ;
else
ci . rta_expires = 0 ;
ci . rta_used = rt - > u . dst . __use ;
ci . rta_clntref = atomic_read ( & rt - > u . dst . __refcnt ) ;
ci . rta_error = rt - > u . dst . error ;
ci . rta_id = 0 ;
ci . rta_ts = 0 ;
ci . rta_tsage = 0 ;
2006-08-22 11:01:27 +04:00
NLA_PUT ( skb , RTA_CACHEINFO , sizeof ( ci ) , & ci ) ;
return nlmsg_end ( skb , nlh ) ;
nla_put_failure :
return nlmsg_cancel ( skb , nlh ) ;
2005-04-17 02:20:36 +04:00
}
2006-08-11 10:11:17 +04:00
int rt6_dump_route ( struct rt6_info * rt , void * p_arg )
2005-04-17 02:20:36 +04:00
{
struct rt6_rtnl_dump_arg * arg = ( struct rt6_rtnl_dump_arg * ) p_arg ;
int prefix ;
2006-08-22 11:01:27 +04:00
if ( nlmsg_len ( arg - > cb - > nlh ) > = sizeof ( struct rtmsg ) ) {
struct rtmsg * rtm = nlmsg_data ( arg - > cb - > nlh ) ;
2005-04-17 02:20:36 +04:00
prefix = ( rtm - > rtm_flags & RTM_F_PREFIX ) ! = 0 ;
} else
prefix = 0 ;
return rt6_fill_node ( arg - > skb , rt , NULL , NULL , 0 , RTM_NEWROUTE ,
NETLINK_CB ( arg - > cb - > skb ) . pid , arg - > cb - > nlh - > nlmsg_seq ,
2005-06-22 00:51:04 +04:00
prefix , NLM_F_MULTI ) ;
2005-04-17 02:20:36 +04:00
}
int inet6_rtm_getroute ( struct sk_buff * in_skb , struct nlmsghdr * nlh , void * arg )
{
2006-08-22 11:01:47 +04:00
struct nlattr * tb [ RTA_MAX + 1 ] ;
struct rt6_info * rt ;
2005-04-17 02:20:36 +04:00
struct sk_buff * skb ;
2006-08-22 11:01:47 +04:00
struct rtmsg * rtm ;
2005-04-17 02:20:36 +04:00
struct flowi fl ;
2006-08-22 11:01:47 +04:00
int err , iif = 0 ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:47 +04:00
err = nlmsg_parse ( nlh , sizeof ( * rtm ) , tb , RTA_MAX , rtm_ipv6_policy ) ;
if ( err < 0 )
goto errout ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:47 +04:00
err = - EINVAL ;
2005-04-17 02:20:36 +04:00
memset ( & fl , 0 , sizeof ( fl ) ) ;
2006-08-22 11:01:47 +04:00
if ( tb [ RTA_SRC ] ) {
if ( nla_len ( tb [ RTA_SRC ] ) < sizeof ( struct in6_addr ) )
goto errout ;
ipv6_addr_copy ( & fl . fl6_src , nla_data ( tb [ RTA_SRC ] ) ) ;
}
if ( tb [ RTA_DST ] ) {
if ( nla_len ( tb [ RTA_DST ] ) < sizeof ( struct in6_addr ) )
goto errout ;
ipv6_addr_copy ( & fl . fl6_dst , nla_data ( tb [ RTA_DST ] ) ) ;
}
if ( tb [ RTA_IIF ] )
iif = nla_get_u32 ( tb [ RTA_IIF ] ) ;
if ( tb [ RTA_OIF ] )
fl . oif = nla_get_u32 ( tb [ RTA_OIF ] ) ;
2005-04-17 02:20:36 +04:00
if ( iif ) {
struct net_device * dev ;
dev = __dev_get_by_index ( iif ) ;
if ( ! dev ) {
err = - ENODEV ;
2006-08-22 11:01:47 +04:00
goto errout ;
2005-04-17 02:20:36 +04:00
}
}
2006-08-22 11:01:47 +04:00
skb = alloc_skb ( NLMSG_GOODSIZE , GFP_KERNEL ) ;
if ( skb = = NULL ) {
err = - ENOBUFS ;
goto errout ;
}
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:47 +04:00
/* Reserve room for dummy headers, this skb can pass
through good chunk of routing engine .
*/
skb - > mac . raw = skb - > data ;
skb_reserve ( skb , MAX_HEADER + sizeof ( struct ipv6hdr ) ) ;
2005-04-17 02:20:36 +04:00
2006-08-22 11:01:47 +04:00
rt = ( struct rt6_info * ) ip6_route_output ( NULL , & fl ) ;
2005-04-17 02:20:36 +04:00
skb - > dst = & rt - > u . dst ;
2006-08-22 11:01:47 +04:00
err = rt6_fill_node ( skb , rt , & fl . fl6_dst , & fl . fl6_src , iif ,
2005-04-17 02:20:36 +04:00
RTM_NEWROUTE , NETLINK_CB ( in_skb ) . pid ,
2005-06-22 00:51:04 +04:00
nlh - > nlmsg_seq , 0 , 0 ) ;
2005-04-17 02:20:36 +04:00
if ( err < 0 ) {
2006-08-22 11:01:47 +04:00
kfree_skb ( skb ) ;
goto errout ;
2005-04-17 02:20:36 +04:00
}
2006-08-15 11:30:25 +04:00
err = rtnl_unicast ( skb , NETLINK_CB ( in_skb ) . pid ) ;
2006-08-22 11:01:47 +04:00
errout :
2005-04-17 02:20:36 +04:00
return err ;
}
2006-08-22 11:01:08 +04:00
void inet6_rt_notify ( int event , struct rt6_info * rt , struct nl_info * info )
2005-04-17 02:20:36 +04:00
{
struct sk_buff * skb ;
2006-08-22 11:01:08 +04:00
u32 pid = 0 , seq = 0 ;
struct nlmsghdr * nlh = NULL ;
2006-08-15 11:35:24 +04:00
int payload = sizeof ( struct rtmsg ) + 256 ;
int err = - ENOBUFS ;
2006-08-22 11:01:08 +04:00
if ( info ) {
pid = info - > pid ;
nlh = info - > nlh ;
if ( nlh )
seq = nlh - > nlmsg_seq ;
}
2006-08-15 11:35:24 +04:00
skb = nlmsg_new ( nlmsg_total_size ( payload ) , gfp_any ( ) ) ;
if ( skb = = NULL )
goto errout ;
err = rt6_fill_node ( skb , rt , NULL , NULL , 0 , event , pid , seq , 0 , 0 ) ;
if ( err < 0 ) {
2005-04-17 02:20:36 +04:00
kfree_skb ( skb ) ;
2006-08-15 11:35:24 +04:00
goto errout ;
2005-04-17 02:20:36 +04:00
}
2006-08-15 11:35:24 +04:00
err = rtnl_notify ( skb , pid , RTNLGRP_IPV6_ROUTE , nlh , gfp_any ( ) ) ;
errout :
if ( err < 0 )
rtnl_set_sk_err ( RTNLGRP_IPV6_ROUTE , err ) ;
2005-04-17 02:20:36 +04:00
}
/*
* / proc
*/
# ifdef CONFIG_PROC_FS
# define RT6_INFO_LEN (32 + 4 + 32 + 4 + 32 + 40 + 5 + 1)
struct rt6_proc_arg
{
char * buffer ;
int offset ;
int length ;
int skip ;
int len ;
} ;
static int rt6_info_route ( struct rt6_info * rt , void * p_arg )
{
struct rt6_proc_arg * arg = ( struct rt6_proc_arg * ) p_arg ;
int i ;
if ( arg - > skip < arg - > offset / RT6_INFO_LEN ) {
arg - > skip + + ;
return 0 ;
}
if ( arg - > len > = arg - > length )
return 0 ;
for ( i = 0 ; i < 16 ; i + + ) {
sprintf ( arg - > buffer + arg - > len , " %02x " ,
rt - > rt6i_dst . addr . s6_addr [ i ] ) ;
arg - > len + = 2 ;
}
arg - > len + = sprintf ( arg - > buffer + arg - > len , " %02x " ,
rt - > rt6i_dst . plen ) ;
# ifdef CONFIG_IPV6_SUBTREES
for ( i = 0 ; i < 16 ; i + + ) {
sprintf ( arg - > buffer + arg - > len , " %02x " ,
rt - > rt6i_src . addr . s6_addr [ i ] ) ;
arg - > len + = 2 ;
}
arg - > len + = sprintf ( arg - > buffer + arg - > len , " %02x " ,
rt - > rt6i_src . plen ) ;
# else
sprintf ( arg - > buffer + arg - > len ,
" 00000000000000000000000000000000 00 " ) ;
arg - > len + = 36 ;
# endif
if ( rt - > rt6i_nexthop ) {
for ( i = 0 ; i < 16 ; i + + ) {
sprintf ( arg - > buffer + arg - > len , " %02x " ,
rt - > rt6i_nexthop - > primary_key [ i ] ) ;
arg - > len + = 2 ;
}
} else {
sprintf ( arg - > buffer + arg - > len ,
" 00000000000000000000000000000000 " ) ;
arg - > len + = 32 ;
}
arg - > len + = sprintf ( arg - > buffer + arg - > len ,
" %08x %08x %08x %08x %8s \n " ,
rt - > rt6i_metric , atomic_read ( & rt - > u . dst . __refcnt ) ,
rt - > u . dst . __use , rt - > rt6i_flags ,
rt - > rt6i_dev ? rt - > rt6i_dev - > name : " " ) ;
return 0 ;
}
static int rt6_proc_info ( char * buffer , char * * start , off_t offset , int length )
{
2006-08-05 10:20:06 +04:00
struct rt6_proc_arg arg = {
. buffer = buffer ,
. offset = offset ,
. length = length ,
} ;
2005-04-17 02:20:36 +04:00
2006-08-05 10:20:06 +04:00
fib6_clean_all ( rt6_info_route , 0 , & arg ) ;
2005-04-17 02:20:36 +04:00
* start = buffer ;
if ( offset )
* start + = offset % RT6_INFO_LEN ;
arg . len - = offset % RT6_INFO_LEN ;
if ( arg . len > length )
arg . len = length ;
if ( arg . len < 0 )
arg . len = 0 ;
return arg . len ;
}
static int rt6_stats_seq_show ( struct seq_file * seq , void * v )
{
seq_printf ( seq , " %04x %04x %04x %04x %04x %04x %04x \n " ,
rt6_stats . fib_nodes , rt6_stats . fib_route_nodes ,
rt6_stats . fib_rt_alloc , rt6_stats . fib_rt_entries ,
rt6_stats . fib_rt_cache ,
atomic_read ( & ip6_dst_ops . entries ) ,
rt6_stats . fib_discarded_routes ) ;
return 0 ;
}
static int rt6_stats_seq_open ( struct inode * inode , struct file * file )
{
return single_open ( file , rt6_stats_seq_show , NULL ) ;
}
static struct file_operations rt6_stats_seq_fops = {
. owner = THIS_MODULE ,
. open = rt6_stats_seq_open ,
. read = seq_read ,
. llseek = seq_lseek ,
. release = single_release ,
} ;
# endif /* CONFIG_PROC_FS */
# ifdef CONFIG_SYSCTL
static int flush_delay ;
static
int ipv6_sysctl_rtcache_flush ( ctl_table * ctl , int write , struct file * filp ,
void __user * buffer , size_t * lenp , loff_t * ppos )
{
if ( write ) {
proc_dointvec ( ctl , write , filp , buffer , lenp , ppos ) ;
fib6_run_gc ( flush_delay < = 0 ? ~ 0UL : ( unsigned long ) flush_delay ) ;
return 0 ;
} else
return - EINVAL ;
}
ctl_table ipv6_route_table [ ] = {
{
. ctl_name = NET_IPV6_ROUTE_FLUSH ,
. procname = " flush " ,
. data = & flush_delay ,
. maxlen = sizeof ( int ) ,
2005-04-28 23:11:49 +04:00
. mode = 0200 ,
2005-04-17 02:20:36 +04:00
. proc_handler = & ipv6_sysctl_rtcache_flush
} ,
{
. ctl_name = NET_IPV6_ROUTE_GC_THRESH ,
. procname = " gc_thresh " ,
. data = & ip6_dst_ops . gc_thresh ,
. maxlen = sizeof ( int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec ,
} ,
{
. ctl_name = NET_IPV6_ROUTE_MAX_SIZE ,
. procname = " max_size " ,
. data = & ip6_rt_max_size ,
. maxlen = sizeof ( int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec ,
} ,
{
. ctl_name = NET_IPV6_ROUTE_GC_MIN_INTERVAL ,
. procname = " gc_min_interval " ,
. data = & ip6_rt_gc_min_interval ,
. maxlen = sizeof ( int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec_jiffies ,
. strategy = & sysctl_jiffies ,
} ,
{
. ctl_name = NET_IPV6_ROUTE_GC_TIMEOUT ,
. procname = " gc_timeout " ,
. data = & ip6_rt_gc_timeout ,
. maxlen = sizeof ( int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec_jiffies ,
. strategy = & sysctl_jiffies ,
} ,
{
. ctl_name = NET_IPV6_ROUTE_GC_INTERVAL ,
. procname = " gc_interval " ,
. data = & ip6_rt_gc_interval ,
. maxlen = sizeof ( int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec_jiffies ,
. strategy = & sysctl_jiffies ,
} ,
{
. ctl_name = NET_IPV6_ROUTE_GC_ELASTICITY ,
. procname = " gc_elasticity " ,
. data = & ip6_rt_gc_elasticity ,
. maxlen = sizeof ( int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec_jiffies ,
. strategy = & sysctl_jiffies ,
} ,
{
. ctl_name = NET_IPV6_ROUTE_MTU_EXPIRES ,
. procname = " mtu_expires " ,
. data = & ip6_rt_mtu_expires ,
. maxlen = sizeof ( int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec_jiffies ,
. strategy = & sysctl_jiffies ,
} ,
{
. ctl_name = NET_IPV6_ROUTE_MIN_ADVMSS ,
. procname = " min_adv_mss " ,
. data = & ip6_rt_min_advmss ,
. maxlen = sizeof ( int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec_jiffies ,
. strategy = & sysctl_jiffies ,
} ,
{
. ctl_name = NET_IPV6_ROUTE_GC_MIN_INTERVAL_MS ,
. procname = " gc_min_interval_ms " ,
. data = & ip6_rt_gc_min_interval ,
. maxlen = sizeof ( int ) ,
. mode = 0644 ,
. proc_handler = & proc_dointvec_ms_jiffies ,
. strategy = & sysctl_ms_jiffies ,
} ,
{ . ctl_name = 0 }
} ;
# endif
void __init ip6_route_init ( void )
{
struct proc_dir_entry * p ;
2006-08-27 06:25:52 +04:00
ip6_dst_ops . kmem_cachep =
kmem_cache_create ( " ip6_dst_cache " , sizeof ( struct rt6_info ) , 0 ,
SLAB_HWCACHE_ALIGN | SLAB_PANIC , NULL , NULL ) ;
2005-04-17 02:20:36 +04:00
fib6_init ( ) ;
# ifdef CONFIG_PROC_FS
p = proc_net_create ( " ipv6_route " , 0 , rt6_proc_info ) ;
if ( p )
p - > owner = THIS_MODULE ;
proc_net_fops_create ( " rt6_stats " , S_IRUGO , & rt6_stats_seq_fops ) ;
# endif
# ifdef CONFIG_XFRM
xfrm6_init ( ) ;
# endif
2006-08-04 14:39:02 +04:00
# ifdef CONFIG_IPV6_MULTIPLE_TABLES
fib6_rules_init ( ) ;
# endif
2005-04-17 02:20:36 +04:00
}
void ip6_route_cleanup ( void )
{
2006-08-04 14:39:02 +04:00
# ifdef CONFIG_IPV6_MULTIPLE_TABLES
fib6_rules_cleanup ( ) ;
# endif
2005-04-17 02:20:36 +04:00
# ifdef CONFIG_PROC_FS
proc_net_remove ( " ipv6_route " ) ;
proc_net_remove ( " rt6_stats " ) ;
# endif
# ifdef CONFIG_XFRM
xfrm6_fini ( ) ;
# endif
rt6_ifdown ( NULL ) ;
fib6_gc_cleanup ( ) ;
kmem_cache_destroy ( ip6_dst_ops . kmem_cachep ) ;
}