2007-07-14 18:55:06 -07:00
/*
* Copyright ( c ) 2007 Patrick McHardy < kaber @ trash . net >
*
* This program is free software ; you can redistribute it and / or
* modify it under the terms of the GNU General Public License as
* published by the Free Software Foundation ; either version 2 of
* the License , or ( at your option ) any later version .
*
* The code this is based on carried the following copyright notice :
* - - -
* ( C ) Copyright 2001 - 2006
* Alex Zeffertt , Cambridge Broadband Ltd , ajz @ cambridgebroadband . com
* Re - worked by Ben Greear < greearb @ candelatech . com >
* - - -
*/
# include <linux/kernel.h>
# include <linux/types.h>
# include <linux/module.h>
# include <linux/init.h>
# include <linux/errno.h>
# include <linux/slab.h>
# include <linux/string.h>
2008-05-12 21:21:05 +02:00
# include <linux/rculist.h>
2007-07-14 18:55:06 -07:00
# include <linux/notifier.h>
# include <linux/netdevice.h>
# include <linux/etherdevice.h>
# include <linux/ethtool.h>
# include <linux/if_arp.h>
# include <linux/if_link.h>
# include <linux/if_macvlan.h>
# include <net/rtnetlink.h>
2009-11-26 06:07:10 +00:00
# include <net/xfrm.h>
2007-07-14 18:55:06 -07:00
# define MACVLAN_HASH_SIZE (1 << BITS_PER_BYTE)
struct macvlan_port {
struct net_device * dev ;
struct hlist_head vlan_hash [ MACVLAN_HASH_SIZE ] ;
struct list_head vlans ;
} ;
2009-11-17 08:53:49 +00:00
/**
* struct macvlan_rx_stats - MACVLAN percpu rx stats
* @ rx_packets : number of received packets
* @ rx_bytes : number of received bytes
* @ multicast : number of received multicast packets
* @ rx_errors : number of errors
*/
struct macvlan_rx_stats {
unsigned long rx_packets ;
unsigned long rx_bytes ;
unsigned long multicast ;
unsigned long rx_errors ;
} ;
2007-07-14 18:55:06 -07:00
struct macvlan_dev {
struct net_device * dev ;
struct list_head list ;
struct hlist_node hlist ;
struct macvlan_port * port ;
struct net_device * lowerdev ;
2009-11-17 08:53:49 +00:00
struct macvlan_rx_stats * rx_stats ;
2009-11-26 06:07:10 +00:00
enum macvlan_mode mode ;
2007-07-14 18:55:06 -07:00
} ;
static struct macvlan_dev * macvlan_hash_lookup ( const struct macvlan_port * port ,
const unsigned char * addr )
{
struct macvlan_dev * vlan ;
struct hlist_node * n ;
hlist_for_each_entry_rcu ( vlan , n , & port - > vlan_hash [ addr [ 5 ] ] , hlist ) {
2009-09-01 05:46:05 +00:00
if ( ! compare_ether_addr_64bits ( vlan - > dev - > dev_addr , addr ) )
2007-07-14 18:55:06 -07:00
return vlan ;
}
return NULL ;
}
2009-03-13 13:16:13 -07:00
static void macvlan_hash_add ( struct macvlan_dev * vlan )
{
struct macvlan_port * port = vlan - > port ;
const unsigned char * addr = vlan - > dev - > dev_addr ;
hlist_add_head_rcu ( & vlan - > hlist , & port - > vlan_hash [ addr [ 5 ] ] ) ;
}
static void macvlan_hash_del ( struct macvlan_dev * vlan )
{
hlist_del_rcu ( & vlan - > hlist ) ;
synchronize_rcu ( ) ;
}
static void macvlan_hash_change_addr ( struct macvlan_dev * vlan ,
const unsigned char * addr )
{
macvlan_hash_del ( vlan ) ;
/* Now that we are unhashed it is safe to change the device
* address without confusing packet delivery .
*/
memcpy ( vlan - > dev - > dev_addr , addr , ETH_ALEN ) ;
macvlan_hash_add ( vlan ) ;
}
static int macvlan_addr_busy ( const struct macvlan_port * port ,
const unsigned char * addr )
{
/* Test to see if the specified multicast address is
* currently in use by the underlying device or
* another macvlan .
*/
2009-09-01 05:46:05 +00:00
if ( ! compare_ether_addr_64bits ( port - > dev - > dev_addr , addr ) )
2009-03-13 13:16:13 -07:00
return 1 ;
if ( macvlan_hash_lookup ( port , addr ) )
return 1 ;
return 0 ;
}
2009-11-26 06:07:09 +00:00
static inline void macvlan_count_rx ( const struct macvlan_dev * vlan ,
unsigned int len , bool success ,
bool multicast )
{
struct macvlan_rx_stats * rx_stats ;
rx_stats = per_cpu_ptr ( vlan - > rx_stats , smp_processor_id ( ) ) ;
if ( likely ( success ) ) {
rx_stats - > rx_packets + + ; ;
rx_stats - > rx_bytes + = len ;
if ( multicast )
rx_stats - > multicast + + ;
} else {
rx_stats - > rx_errors + + ;
}
}
static int macvlan_broadcast_one ( struct sk_buff * skb , struct net_device * dev ,
2009-11-26 06:07:10 +00:00
const struct ethhdr * eth , bool local )
2009-11-26 06:07:09 +00:00
{
if ( ! skb )
return NET_RX_DROP ;
2009-11-26 06:07:10 +00:00
if ( local )
return dev_forward_skb ( dev , skb ) ;
2009-11-26 06:07:09 +00:00
skb - > dev = dev ;
if ( ! compare_ether_addr_64bits ( eth - > h_dest ,
dev - > broadcast ) )
skb - > pkt_type = PACKET_BROADCAST ;
else
skb - > pkt_type = PACKET_MULTICAST ;
return netif_rx ( skb ) ;
}
2007-07-14 18:55:06 -07:00
static void macvlan_broadcast ( struct sk_buff * skb ,
2009-11-26 06:07:10 +00:00
const struct macvlan_port * port ,
struct net_device * src ,
enum macvlan_mode mode )
2007-07-14 18:55:06 -07:00
{
const struct ethhdr * eth = eth_hdr ( skb ) ;
const struct macvlan_dev * vlan ;
struct hlist_node * n ;
struct sk_buff * nskb ;
unsigned int i ;
2009-11-26 06:07:09 +00:00
int err ;
2007-07-14 18:55:06 -07:00
2008-11-26 15:30:48 -08:00
if ( skb - > protocol = = htons ( ETH_P_PAUSE ) )
return ;
2007-07-14 18:55:06 -07:00
for ( i = 0 ; i < MACVLAN_HASH_SIZE ; i + + ) {
hlist_for_each_entry_rcu ( vlan , n , & port - > vlan_hash [ i ] , hlist ) {
2009-11-26 06:07:10 +00:00
if ( vlan - > dev = = src | | ! ( vlan - > mode & mode ) )
continue ;
2007-07-14 18:55:06 -07:00
nskb = skb_clone ( skb , GFP_ATOMIC ) ;
2009-11-26 06:07:10 +00:00
err = macvlan_broadcast_one ( nskb , vlan - > dev , eth ,
mode = = MACVLAN_MODE_BRIDGE ) ;
2009-11-26 06:07:09 +00:00
macvlan_count_rx ( vlan , skb - > len + ETH_HLEN ,
err = = NET_RX_SUCCESS , 1 ) ;
2007-07-14 18:55:06 -07:00
}
}
}
/* called under rcu_read_lock() from netif_receive_skb */
static struct sk_buff * macvlan_handle_frame ( struct sk_buff * skb )
{
const struct ethhdr * eth = eth_hdr ( skb ) ;
const struct macvlan_port * port ;
const struct macvlan_dev * vlan ;
2009-11-26 06:07:10 +00:00
const struct macvlan_dev * src ;
2007-07-14 18:55:06 -07:00
struct net_device * dev ;
2009-11-26 06:07:09 +00:00
unsigned int len ;
2007-07-14 18:55:06 -07:00
port = rcu_dereference ( skb - > dev - > macvlan_port ) ;
if ( port = = NULL )
return skb ;
if ( is_multicast_ether_addr ( eth - > h_dest ) ) {
2009-11-26 06:07:10 +00:00
src = macvlan_hash_lookup ( port , eth - > h_source ) ;
if ( ! src )
/* frame comes from an external address */
macvlan_broadcast ( skb , port , NULL ,
MACVLAN_MODE_PRIVATE |
MACVLAN_MODE_VEPA |
MACVLAN_MODE_BRIDGE ) ;
else if ( src - > mode = = MACVLAN_MODE_VEPA )
/* flood to everyone except source */
macvlan_broadcast ( skb , port , src - > dev ,
MACVLAN_MODE_VEPA |
MACVLAN_MODE_BRIDGE ) ;
else if ( src - > mode = = MACVLAN_MODE_BRIDGE )
/*
* flood only to VEPA ports , bridge ports
* already saw the frame on the way out .
*/
macvlan_broadcast ( skb , port , src - > dev ,
MACVLAN_MODE_VEPA ) ;
2007-07-14 18:55:06 -07:00
return skb ;
}
vlan = macvlan_hash_lookup ( port , eth - > h_dest ) ;
if ( vlan = = NULL )
return skb ;
dev = vlan - > dev ;
if ( unlikely ( ! ( dev - > flags & IFF_UP ) ) ) {
kfree_skb ( skb ) ;
return NULL ;
}
2009-11-26 06:07:09 +00:00
len = skb - > len + ETH_HLEN ;
2007-07-14 18:55:06 -07:00
skb = skb_share_check ( skb , GFP_ATOMIC ) ;
2009-11-26 06:07:09 +00:00
macvlan_count_rx ( vlan , len , skb ! = NULL , 0 ) ;
if ( ! skb )
2007-07-14 18:55:06 -07:00
return NULL ;
skb - > dev = dev ;
skb - > pkt_type = PACKET_HOST ;
netif_rx ( skb ) ;
return NULL ;
}
2009-11-26 06:07:10 +00:00
static int macvlan_queue_xmit ( struct sk_buff * skb , struct net_device * dev )
{
const struct macvlan_dev * vlan = netdev_priv ( dev ) ;
const struct macvlan_port * port = vlan - > port ;
const struct macvlan_dev * dest ;
if ( vlan - > mode = = MACVLAN_MODE_BRIDGE ) {
const struct ethhdr * eth = ( void * ) skb - > data ;
/* send to other bridge ports directly */
if ( is_multicast_ether_addr ( eth - > h_dest ) ) {
macvlan_broadcast ( skb , port , dev , MACVLAN_MODE_BRIDGE ) ;
goto xmit_world ;
}
dest = macvlan_hash_lookup ( port , eth - > h_dest ) ;
if ( dest & & dest - > mode = = MACVLAN_MODE_BRIDGE ) {
unsigned int length = skb - > len + ETH_HLEN ;
int ret = dev_forward_skb ( dest - > dev , skb ) ;
macvlan_count_rx ( dest , length ,
ret = = NET_RX_SUCCESS , 0 ) ;
return NET_XMIT_SUCCESS ;
}
}
xmit_world :
skb - > dev = vlan - > lowerdev ;
return dev_queue_xmit ( skb ) ;
}
2009-08-31 19:50:51 +00:00
static netdev_tx_t macvlan_start_xmit ( struct sk_buff * skb ,
struct net_device * dev )
2007-07-14 18:55:06 -07:00
{
2009-09-03 00:11:45 +00:00
int i = skb_get_queue_mapping ( skb ) ;
struct netdev_queue * txq = netdev_get_tx_queue ( dev , i ) ;
2007-07-14 18:55:06 -07:00
unsigned int len = skb - > len ;
int ret ;
2009-11-26 06:07:10 +00:00
ret = macvlan_queue_xmit ( skb , dev ) ;
2007-07-14 18:55:06 -07:00
if ( likely ( ret = = NET_XMIT_SUCCESS ) ) {
2009-09-03 00:11:45 +00:00
txq - > tx_packets + + ;
txq - > tx_bytes + = len ;
} else
txq - > tx_dropped + + ;
2009-11-10 06:14:24 +00:00
return ret ;
2007-07-14 18:55:06 -07:00
}
static int macvlan_hard_header ( struct sk_buff * skb , struct net_device * dev ,
2007-10-09 01:40:57 -07:00
unsigned short type , const void * daddr ,
const void * saddr , unsigned len )
2007-07-14 18:55:06 -07:00
{
const struct macvlan_dev * vlan = netdev_priv ( dev ) ;
struct net_device * lowerdev = vlan - > lowerdev ;
2007-10-09 01:36:32 -07:00
return dev_hard_header ( skb , lowerdev , type , daddr ,
saddr ? : dev - > dev_addr , len ) ;
2007-07-14 18:55:06 -07:00
}
2007-10-09 01:40:57 -07:00
static const struct header_ops macvlan_hard_header_ops = {
. create = macvlan_hard_header ,
. rebuild = eth_rebuild_header ,
. parse = eth_header_parse ,
. cache = eth_header_cache ,
. cache_update = eth_header_cache_update ,
} ;
2007-07-14 18:55:06 -07:00
static int macvlan_open ( struct net_device * dev )
{
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
struct net_device * lowerdev = vlan - > lowerdev ;
int err ;
2009-03-13 13:16:13 -07:00
err = - EBUSY ;
if ( macvlan_addr_busy ( vlan - > port , dev - > dev_addr ) )
goto out ;
2009-05-22 23:22:17 +00:00
err = dev_unicast_add ( lowerdev , dev - > dev_addr ) ;
2007-07-14 18:55:06 -07:00
if ( err < 0 )
2008-07-14 20:57:07 -07:00
goto out ;
if ( dev - > flags & IFF_ALLMULTI ) {
err = dev_set_allmulti ( lowerdev , 1 ) ;
if ( err < 0 )
goto del_unicast ;
}
2009-03-13 13:16:13 -07:00
macvlan_hash_add ( vlan ) ;
2007-07-14 18:55:06 -07:00
return 0 ;
2008-07-14 20:57:07 -07:00
del_unicast :
2009-05-22 23:22:17 +00:00
dev_unicast_delete ( lowerdev , dev - > dev_addr ) ;
2008-07-14 20:57:07 -07:00
out :
return err ;
2007-07-14 18:55:06 -07:00
}
static int macvlan_stop ( struct net_device * dev )
{
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
struct net_device * lowerdev = vlan - > lowerdev ;
dev_mc_unsync ( lowerdev , dev ) ;
if ( dev - > flags & IFF_ALLMULTI )
dev_set_allmulti ( lowerdev , - 1 ) ;
2009-05-22 23:22:17 +00:00
dev_unicast_delete ( lowerdev , dev - > dev_addr ) ;
2007-07-14 18:55:06 -07:00
2009-03-13 13:16:13 -07:00
macvlan_hash_del ( vlan ) ;
2007-07-14 18:55:06 -07:00
return 0 ;
}
2007-11-19 22:00:42 -08:00
static int macvlan_set_mac_address ( struct net_device * dev , void * p )
{
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
struct net_device * lowerdev = vlan - > lowerdev ;
struct sockaddr * addr = p ;
int err ;
if ( ! is_valid_ether_addr ( addr - > sa_data ) )
return - EADDRNOTAVAIL ;
2009-03-13 13:16:13 -07:00
if ( ! ( dev - > flags & IFF_UP ) ) {
/* Just copy in the new address */
memcpy ( dev - > dev_addr , addr - > sa_data , ETH_ALEN ) ;
} else {
/* Rehash and update the device filters */
if ( macvlan_addr_busy ( vlan - > port , addr - > sa_data ) )
return - EBUSY ;
2007-11-19 22:00:42 -08:00
2009-05-22 23:22:17 +00:00
err = dev_unicast_add ( lowerdev , addr - > sa_data ) ;
if ( err )
2009-03-13 13:16:13 -07:00
return err ;
2007-11-19 22:00:42 -08:00
2009-05-22 23:22:17 +00:00
dev_unicast_delete ( lowerdev , dev - > dev_addr ) ;
2009-03-13 13:16:13 -07:00
macvlan_hash_change_addr ( vlan , addr - > sa_data ) ;
}
2007-11-19 22:00:42 -08:00
return 0 ;
}
2007-07-14 18:55:06 -07:00
static void macvlan_change_rx_flags ( struct net_device * dev , int change )
{
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
struct net_device * lowerdev = vlan - > lowerdev ;
if ( change & IFF_ALLMULTI )
dev_set_allmulti ( lowerdev , dev - > flags & IFF_ALLMULTI ? 1 : - 1 ) ;
}
static void macvlan_set_multicast_list ( struct net_device * dev )
{
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
dev_mc_sync ( vlan - > lowerdev , dev ) ;
}
static int macvlan_change_mtu ( struct net_device * dev , int new_mtu )
{
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
if ( new_mtu < 68 | | vlan - > lowerdev - > mtu < new_mtu )
return - EINVAL ;
dev - > mtu = new_mtu ;
return 0 ;
}
/*
* macvlan network devices have devices nesting below it and are a special
* " super class " of normal network devices ; split their locks off into a
* separate class since they always nest .
*/
static struct lock_class_key macvlan_netdev_xmit_lock_key ;
2008-07-22 14:16:42 -07:00
static struct lock_class_key macvlan_netdev_addr_lock_key ;
2007-07-14 18:55:06 -07:00
# define MACVLAN_FEATURES \
( NETIF_F_SG | NETIF_F_ALL_CSUM | NETIF_F_HIGHDMA | NETIF_F_FRAGLIST | \
NETIF_F_GSO | NETIF_F_TSO | NETIF_F_UFO | NETIF_F_GSO_ROBUST | \
NETIF_F_TSO_ECN | NETIF_F_TSO6 )
# define MACVLAN_STATE_MASK \
( ( 1 < < __LINK_STATE_NOCARRIER ) | ( 1 < < __LINK_STATE_DORMANT ) )
2008-07-17 00:34:19 -07:00
static void macvlan_set_lockdep_class_one ( struct net_device * dev ,
struct netdev_queue * txq ,
void * _unused )
2008-07-08 23:13:53 -07:00
{
lockdep_set_class ( & txq - > _xmit_lock ,
& macvlan_netdev_xmit_lock_key ) ;
}
static void macvlan_set_lockdep_class ( struct net_device * dev )
{
2008-07-22 14:16:42 -07:00
lockdep_set_class ( & dev - > addr_list_lock ,
& macvlan_netdev_addr_lock_key ) ;
2008-07-17 00:34:19 -07:00
netdev_for_each_tx_queue ( dev , macvlan_set_lockdep_class_one , NULL ) ;
2008-07-08 23:13:53 -07:00
}
2007-07-14 18:55:06 -07:00
static int macvlan_init ( struct net_device * dev )
{
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
const struct net_device * lowerdev = vlan - > lowerdev ;
dev - > state = ( dev - > state & ~ MACVLAN_STATE_MASK ) |
( lowerdev - > state & MACVLAN_STATE_MASK ) ;
dev - > features = lowerdev - > features & MACVLAN_FEATURES ;
2009-11-23 14:18:53 -08:00
dev - > gso_max_size = lowerdev - > gso_max_size ;
2007-07-14 18:55:06 -07:00
dev - > iflink = lowerdev - > ifindex ;
2009-06-10 09:55:02 +00:00
dev - > hard_header_len = lowerdev - > hard_header_len ;
2007-07-14 18:55:06 -07:00
2008-07-08 23:13:53 -07:00
macvlan_set_lockdep_class ( dev ) ;
2009-11-17 08:53:49 +00:00
vlan - > rx_stats = alloc_percpu ( struct macvlan_rx_stats ) ;
if ( ! vlan - > rx_stats )
return - ENOMEM ;
2007-07-14 18:55:06 -07:00
return 0 ;
}
2009-11-17 08:53:49 +00:00
static void macvlan_uninit ( struct net_device * dev )
{
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
free_percpu ( vlan - > rx_stats ) ;
}
static struct net_device_stats * macvlan_dev_get_stats ( struct net_device * dev )
{
struct net_device_stats * stats = & dev - > stats ;
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
dev_txq_stats_fold ( dev , stats ) ;
if ( vlan - > rx_stats ) {
struct macvlan_rx_stats * p , rx = { 0 } ;
int i ;
for_each_possible_cpu ( i ) {
p = per_cpu_ptr ( vlan - > rx_stats , i ) ;
rx . rx_packets + = p - > rx_packets ;
rx . rx_bytes + = p - > rx_bytes ;
rx . rx_errors + = p - > rx_errors ;
rx . multicast + = p - > multicast ;
}
stats - > rx_packets = rx . rx_packets ;
stats - > rx_bytes = rx . rx_bytes ;
stats - > rx_errors = rx . rx_errors ;
stats - > rx_dropped = rx . rx_errors ;
stats - > multicast = rx . multicast ;
}
return stats ;
}
2007-07-14 18:55:06 -07:00
static void macvlan_ethtool_get_drvinfo ( struct net_device * dev ,
struct ethtool_drvinfo * drvinfo )
{
snprintf ( drvinfo - > driver , 32 , " macvlan " ) ;
snprintf ( drvinfo - > version , 32 , " 0.1 " ) ;
}
static u32 macvlan_ethtool_get_rx_csum ( struct net_device * dev )
{
const struct macvlan_dev * vlan = netdev_priv ( dev ) ;
2009-04-20 04:49:28 +00:00
return dev_ethtool_get_rx_csum ( vlan - > lowerdev ) ;
2007-07-14 18:55:06 -07:00
}
2008-10-29 15:31:53 -07:00
static int macvlan_ethtool_get_settings ( struct net_device * dev ,
struct ethtool_cmd * cmd )
{
const struct macvlan_dev * vlan = netdev_priv ( dev ) ;
2009-04-20 04:49:28 +00:00
return dev_ethtool_get_settings ( vlan - > lowerdev , cmd ) ;
2008-10-29 15:31:53 -07:00
}
static u32 macvlan_ethtool_get_flags ( struct net_device * dev )
{
const struct macvlan_dev * vlan = netdev_priv ( dev ) ;
2009-04-20 04:49:28 +00:00
return dev_ethtool_get_flags ( vlan - > lowerdev ) ;
2008-10-29 15:31:53 -07:00
}
2007-07-14 18:55:06 -07:00
static const struct ethtool_ops macvlan_ethtool_ops = {
. get_link = ethtool_op_get_link ,
2008-10-29 15:31:53 -07:00
. get_settings = macvlan_ethtool_get_settings ,
2007-07-14 18:55:06 -07:00
. get_rx_csum = macvlan_ethtool_get_rx_csum ,
. get_drvinfo = macvlan_ethtool_get_drvinfo ,
2008-10-29 15:31:53 -07:00
. get_flags = macvlan_ethtool_get_flags ,
2007-07-14 18:55:06 -07:00
} ;
2008-11-19 21:51:06 -08:00
static const struct net_device_ops macvlan_netdev_ops = {
. ndo_init = macvlan_init ,
2009-11-17 08:53:49 +00:00
. ndo_uninit = macvlan_uninit ,
2008-11-19 21:51:06 -08:00
. ndo_open = macvlan_open ,
. ndo_stop = macvlan_stop ,
2008-11-20 20:14:53 -08:00
. ndo_start_xmit = macvlan_start_xmit ,
2008-11-19 21:51:06 -08:00
. ndo_change_mtu = macvlan_change_mtu ,
. ndo_change_rx_flags = macvlan_change_rx_flags ,
. ndo_set_mac_address = macvlan_set_mac_address ,
. ndo_set_multicast_list = macvlan_set_multicast_list ,
2009-11-17 08:53:49 +00:00
. ndo_get_stats = macvlan_dev_get_stats ,
2008-11-19 21:51:06 -08:00
. ndo_validate_addr = eth_validate_addr ,
} ;
2007-07-14 18:55:06 -07:00
static void macvlan_setup ( struct net_device * dev )
{
ether_setup ( dev ) ;
net: release dst entry in dev_hard_start_xmit()
One point of contention in high network loads is the dst_release() performed
when a transmited skb is freed. This is because NIC tx completion calls
dev_kree_skb() long after original call to dev_queue_xmit(skb).
CPU cache is cold and the atomic op in dst_release() stalls. On SMP, this is
quite visible if one CPU is 100% handling softirqs for a network device,
since dst_clone() is done by other cpus, involving cache line ping pongs.
It seems right place to release dst is in dev_hard_start_xmit(), for most
devices but ones that are virtual, and some exceptions.
David Miller suggested to define a new device flag, set in alloc_netdev_mq()
(so that most devices set it at init time), and carefuly unset in devices
which dont want a NULL skb->dst in their ndo_start_xmit().
List of devices that must clear this flag is :
- loopback device, because it calls netif_rx() and quoting Patrick :
"ip_route_input() doesn't accept loopback addresses, so loopback packets
already need to have a dst_entry attached."
- appletalk/ipddp.c : needs skb->dst in its xmit function
- And all devices that call again dev_queue_xmit() from their xmit function
(as some classifiers need skb->dst) : bonding, vlan, macvlan, eql, ifb, hdlc_fr
Signed-off-by: Eric Dumazet <dada1@cosmosbay.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2009-05-18 22:19:19 -07:00
dev - > priv_flags & = ~ IFF_XMIT_DST_RELEASE ;
2008-11-19 21:51:06 -08:00
dev - > netdev_ops = & macvlan_netdev_ops ;
2007-07-14 18:55:06 -07:00
dev - > destructor = free_netdev ;
2007-10-09 01:40:57 -07:00
dev - > header_ops = & macvlan_hard_header_ops ,
2007-07-14 18:55:06 -07:00
dev - > ethtool_ops = & macvlan_ethtool_ops ;
dev - > tx_queue_len = 0 ;
}
static int macvlan_port_create ( struct net_device * dev )
{
struct macvlan_port * port ;
unsigned int i ;
if ( dev - > type ! = ARPHRD_ETHER | | dev - > flags & IFF_LOOPBACK )
return - EINVAL ;
port = kzalloc ( sizeof ( * port ) , GFP_KERNEL ) ;
if ( port = = NULL )
return - ENOMEM ;
port - > dev = dev ;
INIT_LIST_HEAD ( & port - > vlans ) ;
for ( i = 0 ; i < MACVLAN_HASH_SIZE ; i + + )
INIT_HLIST_HEAD ( & port - > vlan_hash [ i ] ) ;
rcu_assign_pointer ( dev - > macvlan_port , port ) ;
return 0 ;
}
static void macvlan_port_destroy ( struct net_device * dev )
{
struct macvlan_port * port = dev - > macvlan_port ;
rcu_assign_pointer ( dev - > macvlan_port , NULL ) ;
synchronize_rcu ( ) ;
kfree ( port ) ;
}
static int macvlan_validate ( struct nlattr * tb [ ] , struct nlattr * data [ ] )
{
if ( tb [ IFLA_ADDRESS ] ) {
if ( nla_len ( tb [ IFLA_ADDRESS ] ) ! = ETH_ALEN )
return - EINVAL ;
if ( ! is_valid_ether_addr ( nla_data ( tb [ IFLA_ADDRESS ] ) ) )
return - EADDRNOTAVAIL ;
}
2009-11-26 06:07:11 +00:00
if ( data & & data [ IFLA_MACVLAN_MODE ] ) {
switch ( nla_get_u32 ( data [ IFLA_MACVLAN_MODE ] ) ) {
case MACVLAN_MODE_PRIVATE :
case MACVLAN_MODE_VEPA :
case MACVLAN_MODE_BRIDGE :
break ;
default :
return - EINVAL ;
}
}
2007-07-14 18:55:06 -07:00
return 0 ;
}
2009-09-03 00:11:45 +00:00
static int macvlan_get_tx_queues ( struct net * net ,
struct nlattr * tb [ ] ,
unsigned int * num_tx_queues ,
unsigned int * real_num_tx_queues )
{
struct net_device * real_dev ;
if ( ! tb [ IFLA_LINK ] )
return - EINVAL ;
real_dev = __dev_get_by_index ( net , nla_get_u32 ( tb [ IFLA_LINK ] ) ) ;
if ( ! real_dev )
return - ENODEV ;
* num_tx_queues = real_dev - > num_tx_queues ;
* real_num_tx_queues = real_dev - > real_num_tx_queues ;
return 0 ;
}
2009-11-08 00:53:51 -08:00
static int macvlan_newlink ( struct net * src_net , struct net_device * dev ,
2007-07-14 18:55:06 -07:00
struct nlattr * tb [ ] , struct nlattr * data [ ] )
{
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
struct macvlan_port * port ;
struct net_device * lowerdev ;
int err ;
if ( ! tb [ IFLA_LINK ] )
return - EINVAL ;
2009-11-08 00:53:51 -08:00
lowerdev = __dev_get_by_index ( src_net , nla_get_u32 ( tb [ IFLA_LINK ] ) ) ;
2007-07-14 18:55:06 -07:00
if ( lowerdev = = NULL )
return - ENODEV ;
2009-03-13 13:15:37 -07:00
/* When creating macvlans on top of other macvlans - use
* the real device as the lowerdev .
2008-01-10 22:39:28 -08:00
*/
2009-03-13 13:15:37 -07:00
if ( lowerdev - > rtnl_link_ops = = dev - > rtnl_link_ops ) {
struct macvlan_dev * lowervlan = netdev_priv ( lowerdev ) ;
lowerdev = lowervlan - > lowerdev ;
}
2008-01-10 22:39:28 -08:00
2007-07-14 18:55:06 -07:00
if ( ! tb [ IFLA_MTU ] )
dev - > mtu = lowerdev - > mtu ;
else if ( dev - > mtu > lowerdev - > mtu )
return - EINVAL ;
if ( ! tb [ IFLA_ADDRESS ] )
random_ether_addr ( dev - > dev_addr ) ;
if ( lowerdev - > macvlan_port = = NULL ) {
err = macvlan_port_create ( lowerdev ) ;
if ( err < 0 )
return err ;
}
port = lowerdev - > macvlan_port ;
vlan - > lowerdev = lowerdev ;
vlan - > dev = dev ;
vlan - > port = port ;
2009-11-26 06:07:11 +00:00
vlan - > mode = MACVLAN_MODE_VEPA ;
if ( data & & data [ IFLA_MACVLAN_MODE ] )
vlan - > mode = nla_get_u32 ( data [ IFLA_MACVLAN_MODE ] ) ;
2007-07-14 18:55:06 -07:00
err = register_netdevice ( dev ) ;
if ( err < 0 )
return err ;
list_add_tail ( & vlan - > list , & port - > vlans ) ;
2009-12-03 15:59:22 -08:00
netif_stacked_transfer_operstate ( lowerdev , dev ) ;
2007-07-14 18:55:06 -07:00
return 0 ;
}
2009-10-27 07:06:36 +00:00
static void macvlan_dellink ( struct net_device * dev , struct list_head * head )
2007-07-14 18:55:06 -07:00
{
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
struct macvlan_port * port = vlan - > port ;
list_del ( & vlan - > list ) ;
2009-10-27 07:06:36 +00:00
unregister_netdevice_queue ( dev , head ) ;
2007-07-14 18:55:06 -07:00
if ( list_empty ( & port - > vlans ) )
2008-05-08 01:13:31 -07:00
macvlan_port_destroy ( port - > dev ) ;
2007-07-14 18:55:06 -07:00
}
2009-11-26 06:07:11 +00:00
static int macvlan_changelink ( struct net_device * dev ,
struct nlattr * tb [ ] , struct nlattr * data [ ] )
{
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
if ( data & & data [ IFLA_MACVLAN_MODE ] )
vlan - > mode = nla_get_u32 ( data [ IFLA_MACVLAN_MODE ] ) ;
return 0 ;
}
static size_t macvlan_get_size ( const struct net_device * dev )
{
return nla_total_size ( 4 ) ;
}
static int macvlan_fill_info ( struct sk_buff * skb ,
const struct net_device * dev )
{
struct macvlan_dev * vlan = netdev_priv ( dev ) ;
NLA_PUT_U32 ( skb , IFLA_MACVLAN_MODE , vlan - > mode ) ;
return 0 ;
nla_put_failure :
return - EMSGSIZE ;
}
static const struct nla_policy macvlan_policy [ IFLA_MACVLAN_MAX + 1 ] = {
[ IFLA_MACVLAN_MODE ] = { . type = NLA_U32 } ,
} ;
2007-07-14 18:55:06 -07:00
static struct rtnl_link_ops macvlan_link_ops __read_mostly = {
. kind = " macvlan " ,
. priv_size = sizeof ( struct macvlan_dev ) ,
2009-09-03 00:11:45 +00:00
. get_tx_queues = macvlan_get_tx_queues ,
2007-07-14 18:55:06 -07:00
. setup = macvlan_setup ,
. validate = macvlan_validate ,
. newlink = macvlan_newlink ,
. dellink = macvlan_dellink ,
2009-11-26 06:07:11 +00:00
. maxtype = IFLA_MACVLAN_MAX ,
. policy = macvlan_policy ,
. changelink = macvlan_changelink ,
. get_size = macvlan_get_size ,
. fill_info = macvlan_fill_info ,
2007-07-14 18:55:06 -07:00
} ;
static int macvlan_device_event ( struct notifier_block * unused ,
unsigned long event , void * ptr )
{
struct net_device * dev = ptr ;
struct macvlan_dev * vlan , * next ;
struct macvlan_port * port ;
port = dev - > macvlan_port ;
if ( port = = NULL )
return NOTIFY_DONE ;
switch ( event ) {
case NETDEV_CHANGE :
list_for_each_entry ( vlan , & port - > vlans , list )
2009-12-03 15:59:22 -08:00
netif_stacked_transfer_operstate ( vlan - > lowerdev ,
vlan - > dev ) ;
2007-07-14 18:55:06 -07:00
break ;
case NETDEV_FEAT_CHANGE :
list_for_each_entry ( vlan , & port - > vlans , list ) {
vlan - > dev - > features = dev - > features & MACVLAN_FEATURES ;
2009-11-23 14:18:53 -08:00
vlan - > dev - > gso_max_size = dev - > gso_max_size ;
2007-07-14 18:55:06 -07:00
netdev_features_change ( vlan - > dev ) ;
}
break ;
case NETDEV_UNREGISTER :
list_for_each_entry_safe ( vlan , next , & port - > vlans , list )
2009-10-27 07:06:36 +00:00
macvlan_dellink ( vlan - > dev , NULL ) ;
2007-07-14 18:55:06 -07:00
break ;
}
return NOTIFY_DONE ;
}
static struct notifier_block macvlan_notifier_block __read_mostly = {
. notifier_call = macvlan_device_event ,
} ;
static int __init macvlan_init_module ( void )
{
int err ;
register_netdevice_notifier ( & macvlan_notifier_block ) ;
macvlan_handle_frame_hook = macvlan_handle_frame ;
err = rtnl_link_register ( & macvlan_link_ops ) ;
if ( err < 0 )
goto err1 ;
return 0 ;
err1 :
2008-01-31 16:56:03 -08:00
macvlan_handle_frame_hook = NULL ;
2007-07-14 18:55:06 -07:00
unregister_netdevice_notifier ( & macvlan_notifier_block ) ;
return err ;
}
static void __exit macvlan_cleanup_module ( void )
{
rtnl_link_unregister ( & macvlan_link_ops ) ;
macvlan_handle_frame_hook = NULL ;
unregister_netdevice_notifier ( & macvlan_notifier_block ) ;
}
module_init ( macvlan_init_module ) ;
module_exit ( macvlan_cleanup_module ) ;
MODULE_LICENSE ( " GPL " ) ;
MODULE_AUTHOR ( " Patrick McHardy <kaber@trash.net> " ) ;
MODULE_DESCRIPTION ( " Driver for MAC address based VLANs " ) ;
MODULE_ALIAS_RTNL_LINK ( " macvlan " ) ;